{ "best_metric": null, "best_model_checkpoint": null, "epoch": 1.0, "global_step": 33195, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, "learning_rate": 5.02008032128514e-09, "loss": 2.4155, "step": 1 }, { "epoch": 0.0, "learning_rate": 1.004016064257028e-08, "loss": 2.5479, "step": 2 }, { "epoch": 0.0, "learning_rate": 1.5060240963855425e-08, "loss": 2.5901, "step": 3 }, { "epoch": 0.0, "learning_rate": 2.008032128514056e-08, "loss": 2.7227, "step": 4 }, { "epoch": 0.0, "learning_rate": 2.5100401606425703e-08, "loss": 2.562, "step": 5 }, { "epoch": 0.0, "learning_rate": 3.012048192771085e-08, "loss": 2.8206, "step": 6 }, { "epoch": 0.0, "learning_rate": 3.5140562248995985e-08, "loss": 2.6187, "step": 7 }, { "epoch": 0.0, "learning_rate": 4.016064257028112e-08, "loss": 2.5796, "step": 8 }, { "epoch": 0.0, "learning_rate": 4.5180722891566264e-08, "loss": 2.5427, "step": 9 }, { "epoch": 0.0, "learning_rate": 5.0200803212851406e-08, "loss": 2.6848, "step": 10 }, { "epoch": 0.0, "learning_rate": 5.522088353413655e-08, "loss": 2.696, "step": 11 }, { "epoch": 0.0, "learning_rate": 6.02409638554217e-08, "loss": 2.8428, "step": 12 }, { "epoch": 0.0, "learning_rate": 6.526104417670683e-08, "loss": 2.7173, "step": 13 }, { "epoch": 0.0, "learning_rate": 7.028112449799197e-08, "loss": 2.4712, "step": 14 }, { "epoch": 0.0, "learning_rate": 7.530120481927711e-08, "loss": 2.3896, "step": 15 }, { "epoch": 0.0, "learning_rate": 8.032128514056224e-08, "loss": 2.5011, "step": 16 }, { "epoch": 0.0, "learning_rate": 8.53413654618474e-08, "loss": 2.7654, "step": 17 }, { "epoch": 0.0, "learning_rate": 9.036144578313253e-08, "loss": 2.8972, "step": 18 }, { "epoch": 0.0, "learning_rate": 9.538152610441768e-08, "loss": 2.7473, "step": 19 }, { "epoch": 0.0, "learning_rate": 1.0040160642570281e-07, "loss": 2.4688, "step": 20 }, { "epoch": 0.0, "learning_rate": 1.0542168674698796e-07, "loss": 2.4634, "step": 21 }, { "epoch": 0.0, "learning_rate": 1.104417670682731e-07, "loss": 2.5532, "step": 22 }, { "epoch": 0.0, "learning_rate": 1.1546184738955824e-07, "loss": 2.6824, "step": 23 }, { "epoch": 0.0, "learning_rate": 1.204819277108434e-07, "loss": 2.5073, "step": 24 }, { "epoch": 0.0, "learning_rate": 1.2550200803212853e-07, "loss": 2.9604, "step": 25 }, { "epoch": 0.0, "learning_rate": 1.3052208835341366e-07, "loss": 2.2404, "step": 26 }, { "epoch": 0.0, "learning_rate": 1.355421686746988e-07, "loss": 2.3335, "step": 27 }, { "epoch": 0.0, "learning_rate": 1.4056224899598394e-07, "loss": 2.2633, "step": 28 }, { "epoch": 0.0, "learning_rate": 1.455823293172691e-07, "loss": 2.1682, "step": 29 }, { "epoch": 0.0, "learning_rate": 1.5060240963855423e-07, "loss": 2.259, "step": 30 }, { "epoch": 0.0, "learning_rate": 1.5562248995983936e-07, "loss": 2.3323, "step": 31 }, { "epoch": 0.0, "learning_rate": 1.6064257028112448e-07, "loss": 2.1294, "step": 32 }, { "epoch": 0.0, "learning_rate": 1.6566265060240967e-07, "loss": 1.9897, "step": 33 }, { "epoch": 0.0, "learning_rate": 1.706827309236948e-07, "loss": 1.9979, "step": 34 }, { "epoch": 0.0, "learning_rate": 1.7570281124497993e-07, "loss": 2.1283, "step": 35 }, { "epoch": 0.0, "learning_rate": 1.8072289156626505e-07, "loss": 2.0967, "step": 36 }, { "epoch": 0.0, "learning_rate": 1.857429718875502e-07, "loss": 2.1406, "step": 37 }, { "epoch": 0.0, "learning_rate": 1.9076305220883537e-07, "loss": 2.1028, "step": 38 }, { "epoch": 0.0, "learning_rate": 1.957831325301205e-07, "loss": 1.8724, "step": 39 }, { "epoch": 0.0, "learning_rate": 2.0080321285140563e-07, "loss": 1.9177, "step": 40 }, { "epoch": 0.0, "learning_rate": 2.0582329317269078e-07, "loss": 1.9093, "step": 41 }, { "epoch": 0.0, "learning_rate": 2.108433734939759e-07, "loss": 1.8374, "step": 42 }, { "epoch": 0.0, "learning_rate": 2.1586345381526107e-07, "loss": 1.8722, "step": 43 }, { "epoch": 0.0, "learning_rate": 2.208835341365462e-07, "loss": 1.8756, "step": 44 }, { "epoch": 0.0, "learning_rate": 2.2590361445783135e-07, "loss": 1.7311, "step": 45 }, { "epoch": 0.0, "learning_rate": 2.3092369477911648e-07, "loss": 1.7499, "step": 46 }, { "epoch": 0.0, "learning_rate": 2.359437751004016e-07, "loss": 1.6642, "step": 47 }, { "epoch": 0.0, "learning_rate": 2.409638554216868e-07, "loss": 1.7401, "step": 48 }, { "epoch": 0.0, "learning_rate": 2.459839357429719e-07, "loss": 1.7141, "step": 49 }, { "epoch": 0.0, "learning_rate": 2.5100401606425705e-07, "loss": 1.8718, "step": 50 }, { "epoch": 0.0, "learning_rate": 2.560240963855422e-07, "loss": 1.6438, "step": 51 }, { "epoch": 0.0, "learning_rate": 2.610441767068273e-07, "loss": 1.5062, "step": 52 }, { "epoch": 0.0, "learning_rate": 2.6606425702811247e-07, "loss": 1.6093, "step": 53 }, { "epoch": 0.0, "learning_rate": 2.710843373493976e-07, "loss": 1.5728, "step": 54 }, { "epoch": 0.0, "learning_rate": 2.761044176706828e-07, "loss": 1.6921, "step": 55 }, { "epoch": 0.0, "learning_rate": 2.811244979919679e-07, "loss": 1.7946, "step": 56 }, { "epoch": 0.0, "learning_rate": 2.8614457831325304e-07, "loss": 1.604, "step": 57 }, { "epoch": 0.0, "learning_rate": 2.911646586345382e-07, "loss": 1.5355, "step": 58 }, { "epoch": 0.0, "learning_rate": 2.9618473895582335e-07, "loss": 1.5288, "step": 59 }, { "epoch": 0.0, "learning_rate": 3.0120481927710845e-07, "loss": 1.5636, "step": 60 }, { "epoch": 0.0, "learning_rate": 3.062248995983936e-07, "loss": 1.5856, "step": 61 }, { "epoch": 0.0, "learning_rate": 3.112449799196787e-07, "loss": 1.5604, "step": 62 }, { "epoch": 0.0, "learning_rate": 3.1626506024096387e-07, "loss": 1.537, "step": 63 }, { "epoch": 0.0, "learning_rate": 3.2128514056224897e-07, "loss": 1.5649, "step": 64 }, { "epoch": 0.0, "learning_rate": 3.263052208835342e-07, "loss": 1.5441, "step": 65 }, { "epoch": 0.0, "learning_rate": 3.3132530120481933e-07, "loss": 1.4779, "step": 66 }, { "epoch": 0.0, "learning_rate": 3.363453815261045e-07, "loss": 1.5302, "step": 67 }, { "epoch": 0.0, "learning_rate": 3.413654618473896e-07, "loss": 1.6504, "step": 68 }, { "epoch": 0.0, "learning_rate": 3.4638554216867475e-07, "loss": 1.5765, "step": 69 }, { "epoch": 0.0, "learning_rate": 3.5140562248995985e-07, "loss": 1.4261, "step": 70 }, { "epoch": 0.0, "learning_rate": 3.56425702811245e-07, "loss": 1.5109, "step": 71 }, { "epoch": 0.0, "learning_rate": 3.614457831325301e-07, "loss": 1.4829, "step": 72 }, { "epoch": 0.0, "learning_rate": 3.6646586345381527e-07, "loss": 1.3701, "step": 73 }, { "epoch": 0.0, "learning_rate": 3.714859437751004e-07, "loss": 1.5048, "step": 74 }, { "epoch": 0.0, "learning_rate": 3.7650602409638563e-07, "loss": 1.5005, "step": 75 }, { "epoch": 0.0, "learning_rate": 3.8152610441767073e-07, "loss": 1.4692, "step": 76 }, { "epoch": 0.0, "learning_rate": 3.865461847389559e-07, "loss": 1.4747, "step": 77 }, { "epoch": 0.0, "learning_rate": 3.91566265060241e-07, "loss": 1.478, "step": 78 }, { "epoch": 0.0, "learning_rate": 3.9658634538152615e-07, "loss": 1.4521, "step": 79 }, { "epoch": 0.0, "learning_rate": 4.0160642570281125e-07, "loss": 1.4882, "step": 80 }, { "epoch": 0.0, "learning_rate": 4.066265060240964e-07, "loss": 1.5562, "step": 81 }, { "epoch": 0.0, "learning_rate": 4.1164658634538156e-07, "loss": 1.458, "step": 82 }, { "epoch": 0.0, "learning_rate": 4.1666666666666667e-07, "loss": 1.4043, "step": 83 }, { "epoch": 0.0, "learning_rate": 4.216867469879518e-07, "loss": 1.3, "step": 84 }, { "epoch": 0.0, "learning_rate": 4.2670682730923703e-07, "loss": 1.4576, "step": 85 }, { "epoch": 0.0, "learning_rate": 4.3172690763052213e-07, "loss": 1.4498, "step": 86 }, { "epoch": 0.0, "learning_rate": 4.367469879518073e-07, "loss": 1.506, "step": 87 }, { "epoch": 0.0, "learning_rate": 4.417670682730924e-07, "loss": 1.3972, "step": 88 }, { "epoch": 0.0, "learning_rate": 4.4678714859437755e-07, "loss": 1.4575, "step": 89 }, { "epoch": 0.0, "learning_rate": 4.518072289156627e-07, "loss": 1.4003, "step": 90 }, { "epoch": 0.0, "learning_rate": 4.568273092369478e-07, "loss": 1.2924, "step": 91 }, { "epoch": 0.0, "learning_rate": 4.6184738955823296e-07, "loss": 1.3619, "step": 92 }, { "epoch": 0.0, "learning_rate": 4.6686746987951807e-07, "loss": 1.5461, "step": 93 }, { "epoch": 0.0, "learning_rate": 4.718875502008032e-07, "loss": 1.572, "step": 94 }, { "epoch": 0.0, "learning_rate": 4.769076305220884e-07, "loss": 1.3987, "step": 95 }, { "epoch": 0.0, "learning_rate": 4.819277108433736e-07, "loss": 1.4033, "step": 96 }, { "epoch": 0.0, "learning_rate": 4.869477911646587e-07, "loss": 1.3839, "step": 97 }, { "epoch": 0.0, "learning_rate": 4.919678714859438e-07, "loss": 1.3643, "step": 98 }, { "epoch": 0.0, "learning_rate": 4.96987951807229e-07, "loss": 1.2183, "step": 99 }, { "epoch": 0.0, "learning_rate": 5.020080321285141e-07, "loss": 1.577, "step": 100 }, { "epoch": 0.0, "learning_rate": 5.070281124497993e-07, "loss": 1.3492, "step": 101 }, { "epoch": 0.0, "learning_rate": 5.120481927710844e-07, "loss": 1.267, "step": 102 }, { "epoch": 0.0, "learning_rate": 5.170682730923695e-07, "loss": 1.3755, "step": 103 }, { "epoch": 0.0, "learning_rate": 5.220883534136546e-07, "loss": 1.3232, "step": 104 }, { "epoch": 0.0, "learning_rate": 5.271084337349399e-07, "loss": 1.2084, "step": 105 }, { "epoch": 0.0, "learning_rate": 5.321285140562249e-07, "loss": 1.4172, "step": 106 }, { "epoch": 0.0, "learning_rate": 5.371485943775101e-07, "loss": 1.3521, "step": 107 }, { "epoch": 0.0, "learning_rate": 5.421686746987952e-07, "loss": 1.4406, "step": 108 }, { "epoch": 0.0, "learning_rate": 5.471887550200804e-07, "loss": 1.3184, "step": 109 }, { "epoch": 0.0, "learning_rate": 5.522088353413656e-07, "loss": 1.204, "step": 110 }, { "epoch": 0.0, "learning_rate": 5.572289156626506e-07, "loss": 1.3633, "step": 111 }, { "epoch": 0.0, "learning_rate": 5.622489959839358e-07, "loss": 1.3525, "step": 112 }, { "epoch": 0.0, "learning_rate": 5.672690763052209e-07, "loss": 1.2325, "step": 113 }, { "epoch": 0.0, "learning_rate": 5.722891566265061e-07, "loss": 1.2248, "step": 114 }, { "epoch": 0.0, "learning_rate": 5.773092369477912e-07, "loss": 1.2024, "step": 115 }, { "epoch": 0.0, "learning_rate": 5.823293172690764e-07, "loss": 1.3489, "step": 116 }, { "epoch": 0.0, "learning_rate": 5.873493975903615e-07, "loss": 1.3716, "step": 117 }, { "epoch": 0.0, "learning_rate": 5.923694779116467e-07, "loss": 1.2109, "step": 118 }, { "epoch": 0.0, "learning_rate": 5.973895582329317e-07, "loss": 1.2858, "step": 119 }, { "epoch": 0.0, "learning_rate": 6.024096385542169e-07, "loss": 1.3219, "step": 120 }, { "epoch": 0.0, "learning_rate": 6.074297188755021e-07, "loss": 1.2228, "step": 121 }, { "epoch": 0.0, "learning_rate": 6.124497991967872e-07, "loss": 1.3014, "step": 122 }, { "epoch": 0.0, "learning_rate": 6.174698795180723e-07, "loss": 1.2285, "step": 123 }, { "epoch": 0.0, "learning_rate": 6.224899598393574e-07, "loss": 1.1723, "step": 124 }, { "epoch": 0.0, "learning_rate": 6.275100401606427e-07, "loss": 1.4469, "step": 125 }, { "epoch": 0.0, "learning_rate": 6.325301204819277e-07, "loss": 1.2423, "step": 126 }, { "epoch": 0.0, "learning_rate": 6.375502008032129e-07, "loss": 1.2848, "step": 127 }, { "epoch": 0.0, "learning_rate": 6.425702811244979e-07, "loss": 1.3463, "step": 128 }, { "epoch": 0.0, "learning_rate": 6.475903614457832e-07, "loss": 1.3191, "step": 129 }, { "epoch": 0.0, "learning_rate": 6.526104417670684e-07, "loss": 1.1904, "step": 130 }, { "epoch": 0.0, "learning_rate": 6.576305220883534e-07, "loss": 1.4174, "step": 131 }, { "epoch": 0.0, "learning_rate": 6.626506024096387e-07, "loss": 1.135, "step": 132 }, { "epoch": 0.0, "learning_rate": 6.676706827309237e-07, "loss": 1.2214, "step": 133 }, { "epoch": 0.0, "learning_rate": 6.72690763052209e-07, "loss": 1.22, "step": 134 }, { "epoch": 0.0, "learning_rate": 6.77710843373494e-07, "loss": 1.2402, "step": 135 }, { "epoch": 0.0, "learning_rate": 6.827309236947792e-07, "loss": 1.4093, "step": 136 }, { "epoch": 0.0, "learning_rate": 6.877510040160642e-07, "loss": 1.4006, "step": 137 }, { "epoch": 0.0, "learning_rate": 6.927710843373495e-07, "loss": 1.1896, "step": 138 }, { "epoch": 0.0, "learning_rate": 6.977911646586345e-07, "loss": 1.2017, "step": 139 }, { "epoch": 0.0, "learning_rate": 7.028112449799197e-07, "loss": 1.0653, "step": 140 }, { "epoch": 0.0, "learning_rate": 7.07831325301205e-07, "loss": 1.3293, "step": 141 }, { "epoch": 0.0, "learning_rate": 7.1285140562249e-07, "loss": 1.3657, "step": 142 }, { "epoch": 0.0, "learning_rate": 7.178714859437752e-07, "loss": 1.1977, "step": 143 }, { "epoch": 0.0, "learning_rate": 7.228915662650602e-07, "loss": 1.3591, "step": 144 }, { "epoch": 0.0, "learning_rate": 7.279116465863455e-07, "loss": 1.2922, "step": 145 }, { "epoch": 0.0, "learning_rate": 7.329317269076305e-07, "loss": 1.3021, "step": 146 }, { "epoch": 0.0, "learning_rate": 7.379518072289157e-07, "loss": 1.2247, "step": 147 }, { "epoch": 0.0, "learning_rate": 7.429718875502008e-07, "loss": 1.2728, "step": 148 }, { "epoch": 0.0, "learning_rate": 7.47991967871486e-07, "loss": 1.2058, "step": 149 }, { "epoch": 0.0, "learning_rate": 7.530120481927713e-07, "loss": 1.2694, "step": 150 }, { "epoch": 0.0, "learning_rate": 7.580321285140563e-07, "loss": 1.2841, "step": 151 }, { "epoch": 0.0, "learning_rate": 7.630522088353415e-07, "loss": 1.2338, "step": 152 }, { "epoch": 0.0, "learning_rate": 7.680722891566265e-07, "loss": 1.1969, "step": 153 }, { "epoch": 0.0, "learning_rate": 7.730923694779118e-07, "loss": 1.1537, "step": 154 }, { "epoch": 0.0, "learning_rate": 7.781124497991968e-07, "loss": 1.2491, "step": 155 }, { "epoch": 0.0, "learning_rate": 7.83132530120482e-07, "loss": 1.2469, "step": 156 }, { "epoch": 0.0, "learning_rate": 7.88152610441767e-07, "loss": 1.302, "step": 157 }, { "epoch": 0.0, "learning_rate": 7.931726907630523e-07, "loss": 1.1821, "step": 158 }, { "epoch": 0.0, "learning_rate": 7.981927710843373e-07, "loss": 1.1961, "step": 159 }, { "epoch": 0.0, "learning_rate": 8.032128514056225e-07, "loss": 1.2323, "step": 160 }, { "epoch": 0.0, "learning_rate": 8.082329317269078e-07, "loss": 1.1526, "step": 161 }, { "epoch": 0.0, "learning_rate": 8.132530120481928e-07, "loss": 1.2313, "step": 162 }, { "epoch": 0.0, "learning_rate": 8.182730923694781e-07, "loss": 1.2028, "step": 163 }, { "epoch": 0.0, "learning_rate": 8.232931726907631e-07, "loss": 1.4237, "step": 164 }, { "epoch": 0.0, "learning_rate": 8.283132530120483e-07, "loss": 1.1572, "step": 165 }, { "epoch": 0.01, "learning_rate": 8.333333333333333e-07, "loss": 1.2743, "step": 166 }, { "epoch": 0.01, "learning_rate": 8.383534136546186e-07, "loss": 1.1199, "step": 167 }, { "epoch": 0.01, "learning_rate": 8.433734939759036e-07, "loss": 1.2889, "step": 168 }, { "epoch": 0.01, "learning_rate": 8.483935742971888e-07, "loss": 1.281, "step": 169 }, { "epoch": 0.01, "learning_rate": 8.534136546184741e-07, "loss": 1.2972, "step": 170 }, { "epoch": 0.01, "learning_rate": 8.584337349397591e-07, "loss": 1.2623, "step": 171 }, { "epoch": 0.01, "learning_rate": 8.634538152610443e-07, "loss": 1.2565, "step": 172 }, { "epoch": 0.01, "learning_rate": 8.684738955823293e-07, "loss": 1.2812, "step": 173 }, { "epoch": 0.01, "learning_rate": 8.734939759036146e-07, "loss": 1.2247, "step": 174 }, { "epoch": 0.01, "learning_rate": 8.785140562248996e-07, "loss": 1.3257, "step": 175 }, { "epoch": 0.01, "learning_rate": 8.835341365461848e-07, "loss": 1.3358, "step": 176 }, { "epoch": 0.01, "learning_rate": 8.885542168674699e-07, "loss": 1.3177, "step": 177 }, { "epoch": 0.01, "learning_rate": 8.935742971887551e-07, "loss": 1.2667, "step": 178 }, { "epoch": 0.01, "learning_rate": 8.985943775100401e-07, "loss": 1.2096, "step": 179 }, { "epoch": 0.01, "learning_rate": 9.036144578313254e-07, "loss": 1.2301, "step": 180 }, { "epoch": 0.01, "learning_rate": 9.086345381526106e-07, "loss": 1.2493, "step": 181 }, { "epoch": 0.01, "learning_rate": 9.136546184738956e-07, "loss": 1.1779, "step": 182 }, { "epoch": 0.01, "learning_rate": 9.186746987951809e-07, "loss": 1.1583, "step": 183 }, { "epoch": 0.01, "learning_rate": 9.236947791164659e-07, "loss": 1.2643, "step": 184 }, { "epoch": 0.01, "learning_rate": 9.287148594377511e-07, "loss": 1.1299, "step": 185 }, { "epoch": 0.01, "learning_rate": 9.337349397590361e-07, "loss": 1.2518, "step": 186 }, { "epoch": 0.01, "learning_rate": 9.387550200803214e-07, "loss": 1.2502, "step": 187 }, { "epoch": 0.01, "learning_rate": 9.437751004016064e-07, "loss": 1.1628, "step": 188 }, { "epoch": 0.01, "learning_rate": 9.487951807228916e-07, "loss": 1.2582, "step": 189 }, { "epoch": 0.01, "learning_rate": 9.538152610441769e-07, "loss": 1.2424, "step": 190 }, { "epoch": 0.01, "learning_rate": 9.58835341365462e-07, "loss": 1.2504, "step": 191 }, { "epoch": 0.01, "learning_rate": 9.638554216867472e-07, "loss": 1.2153, "step": 192 }, { "epoch": 0.01, "learning_rate": 9.688755020080322e-07, "loss": 1.3019, "step": 193 }, { "epoch": 0.01, "learning_rate": 9.738955823293175e-07, "loss": 1.1819, "step": 194 }, { "epoch": 0.01, "learning_rate": 9.789156626506025e-07, "loss": 1.2485, "step": 195 }, { "epoch": 0.01, "learning_rate": 9.839357429718876e-07, "loss": 1.272, "step": 196 }, { "epoch": 0.01, "learning_rate": 9.889558232931726e-07, "loss": 1.257, "step": 197 }, { "epoch": 0.01, "learning_rate": 9.93975903614458e-07, "loss": 1.2561, "step": 198 }, { "epoch": 0.01, "learning_rate": 9.98995983935743e-07, "loss": 1.1905, "step": 199 }, { "epoch": 0.01, "learning_rate": 1.0040160642570282e-06, "loss": 1.1709, "step": 200 }, { "epoch": 0.01, "learning_rate": 1.0090361445783135e-06, "loss": 1.3597, "step": 201 }, { "epoch": 0.01, "learning_rate": 1.0140562248995985e-06, "loss": 1.1508, "step": 202 }, { "epoch": 0.01, "learning_rate": 1.0190763052208836e-06, "loss": 1.2331, "step": 203 }, { "epoch": 0.01, "learning_rate": 1.0240963855421688e-06, "loss": 1.2838, "step": 204 }, { "epoch": 0.01, "learning_rate": 1.0291164658634539e-06, "loss": 1.1999, "step": 205 }, { "epoch": 0.01, "learning_rate": 1.034136546184739e-06, "loss": 1.1559, "step": 206 }, { "epoch": 0.01, "learning_rate": 1.0391566265060242e-06, "loss": 1.2174, "step": 207 }, { "epoch": 0.01, "learning_rate": 1.0441767068273092e-06, "loss": 1.2364, "step": 208 }, { "epoch": 0.01, "learning_rate": 1.0491967871485945e-06, "loss": 1.1697, "step": 209 }, { "epoch": 0.01, "learning_rate": 1.0542168674698798e-06, "loss": 1.1979, "step": 210 }, { "epoch": 0.01, "learning_rate": 1.0592369477911648e-06, "loss": 1.1682, "step": 211 }, { "epoch": 0.01, "learning_rate": 1.0642570281124499e-06, "loss": 1.2386, "step": 212 }, { "epoch": 0.01, "learning_rate": 1.069277108433735e-06, "loss": 1.2647, "step": 213 }, { "epoch": 0.01, "learning_rate": 1.0742971887550202e-06, "loss": 1.2115, "step": 214 }, { "epoch": 0.01, "learning_rate": 1.0793172690763052e-06, "loss": 1.1761, "step": 215 }, { "epoch": 0.01, "learning_rate": 1.0843373493975905e-06, "loss": 1.1451, "step": 216 }, { "epoch": 0.01, "learning_rate": 1.0893574297188755e-06, "loss": 1.1812, "step": 217 }, { "epoch": 0.01, "learning_rate": 1.0943775100401608e-06, "loss": 1.2293, "step": 218 }, { "epoch": 0.01, "learning_rate": 1.0993975903614459e-06, "loss": 1.0367, "step": 219 }, { "epoch": 0.01, "learning_rate": 1.1044176706827311e-06, "loss": 1.2104, "step": 220 }, { "epoch": 0.01, "learning_rate": 1.1094377510040162e-06, "loss": 1.2677, "step": 221 }, { "epoch": 0.01, "learning_rate": 1.1144578313253012e-06, "loss": 1.2855, "step": 222 }, { "epoch": 0.01, "learning_rate": 1.1194779116465865e-06, "loss": 1.2546, "step": 223 }, { "epoch": 0.01, "learning_rate": 1.1244979919678715e-06, "loss": 1.2147, "step": 224 }, { "epoch": 0.01, "learning_rate": 1.1295180722891568e-06, "loss": 1.27, "step": 225 }, { "epoch": 0.01, "learning_rate": 1.1345381526104418e-06, "loss": 1.3188, "step": 226 }, { "epoch": 0.01, "learning_rate": 1.139558232931727e-06, "loss": 1.1672, "step": 227 }, { "epoch": 0.01, "learning_rate": 1.1445783132530121e-06, "loss": 1.2582, "step": 228 }, { "epoch": 0.01, "learning_rate": 1.1495983935742972e-06, "loss": 1.2856, "step": 229 }, { "epoch": 0.01, "learning_rate": 1.1546184738955825e-06, "loss": 1.1485, "step": 230 }, { "epoch": 0.01, "learning_rate": 1.1596385542168675e-06, "loss": 1.3519, "step": 231 }, { "epoch": 0.01, "learning_rate": 1.1646586345381528e-06, "loss": 1.1606, "step": 232 }, { "epoch": 0.01, "learning_rate": 1.1696787148594378e-06, "loss": 1.2258, "step": 233 }, { "epoch": 0.01, "learning_rate": 1.174698795180723e-06, "loss": 1.2924, "step": 234 }, { "epoch": 0.01, "learning_rate": 1.1797188755020081e-06, "loss": 1.1928, "step": 235 }, { "epoch": 0.01, "learning_rate": 1.1847389558232934e-06, "loss": 1.1589, "step": 236 }, { "epoch": 0.01, "learning_rate": 1.1897590361445784e-06, "loss": 1.2564, "step": 237 }, { "epoch": 0.01, "learning_rate": 1.1947791164658635e-06, "loss": 1.2231, "step": 238 }, { "epoch": 0.01, "learning_rate": 1.1997991967871485e-06, "loss": 1.2137, "step": 239 }, { "epoch": 0.01, "learning_rate": 1.2048192771084338e-06, "loss": 1.2245, "step": 240 }, { "epoch": 0.01, "learning_rate": 1.209839357429719e-06, "loss": 1.223, "step": 241 }, { "epoch": 0.01, "learning_rate": 1.2148594377510041e-06, "loss": 1.1696, "step": 242 }, { "epoch": 0.01, "learning_rate": 1.2198795180722894e-06, "loss": 1.1564, "step": 243 }, { "epoch": 0.01, "learning_rate": 1.2248995983935744e-06, "loss": 1.2292, "step": 244 }, { "epoch": 0.01, "learning_rate": 1.2299196787148595e-06, "loss": 1.2714, "step": 245 }, { "epoch": 0.01, "learning_rate": 1.2349397590361445e-06, "loss": 1.0826, "step": 246 }, { "epoch": 0.01, "learning_rate": 1.2399598393574298e-06, "loss": 1.2193, "step": 247 }, { "epoch": 0.01, "learning_rate": 1.2449799196787148e-06, "loss": 1.1747, "step": 248 }, { "epoch": 0.01, "learning_rate": 1.25e-06, "loss": 1.2124, "step": 249 }, { "epoch": 0.01, "learning_rate": 1.2550200803212854e-06, "loss": 1.2631, "step": 250 }, { "epoch": 0.01, "learning_rate": 1.2600401606425704e-06, "loss": 1.2247, "step": 251 }, { "epoch": 0.01, "learning_rate": 1.2650602409638555e-06, "loss": 1.215, "step": 252 }, { "epoch": 0.01, "learning_rate": 1.2700803212851407e-06, "loss": 1.2162, "step": 253 }, { "epoch": 0.01, "learning_rate": 1.2751004016064258e-06, "loss": 1.3363, "step": 254 }, { "epoch": 0.01, "learning_rate": 1.280120481927711e-06, "loss": 1.2678, "step": 255 }, { "epoch": 0.01, "learning_rate": 1.2851405622489959e-06, "loss": 1.2551, "step": 256 }, { "epoch": 0.01, "learning_rate": 1.2901606425702811e-06, "loss": 1.2805, "step": 257 }, { "epoch": 0.01, "learning_rate": 1.2951807228915664e-06, "loss": 1.2622, "step": 258 }, { "epoch": 0.01, "learning_rate": 1.3002008032128517e-06, "loss": 1.1876, "step": 259 }, { "epoch": 0.01, "learning_rate": 1.3052208835341367e-06, "loss": 1.2773, "step": 260 }, { "epoch": 0.01, "learning_rate": 1.3102409638554218e-06, "loss": 1.2065, "step": 261 }, { "epoch": 0.01, "learning_rate": 1.3152610441767068e-06, "loss": 1.256, "step": 262 }, { "epoch": 0.01, "learning_rate": 1.320281124497992e-06, "loss": 1.2609, "step": 263 }, { "epoch": 0.01, "learning_rate": 1.3253012048192773e-06, "loss": 1.152, "step": 264 }, { "epoch": 0.01, "learning_rate": 1.3303212851405622e-06, "loss": 1.1904, "step": 265 }, { "epoch": 0.01, "learning_rate": 1.3353413654618474e-06, "loss": 1.095, "step": 266 }, { "epoch": 0.01, "learning_rate": 1.3403614457831327e-06, "loss": 1.0817, "step": 267 }, { "epoch": 0.01, "learning_rate": 1.345381526104418e-06, "loss": 1.2191, "step": 268 }, { "epoch": 0.01, "learning_rate": 1.350401606425703e-06, "loss": 1.257, "step": 269 }, { "epoch": 0.01, "learning_rate": 1.355421686746988e-06, "loss": 1.2578, "step": 270 }, { "epoch": 0.01, "learning_rate": 1.3604417670682731e-06, "loss": 1.0878, "step": 271 }, { "epoch": 0.01, "learning_rate": 1.3654618473895584e-06, "loss": 1.1508, "step": 272 }, { "epoch": 0.01, "learning_rate": 1.3704819277108436e-06, "loss": 1.141, "step": 273 }, { "epoch": 0.01, "learning_rate": 1.3755020080321285e-06, "loss": 1.3189, "step": 274 }, { "epoch": 0.01, "learning_rate": 1.3805220883534137e-06, "loss": 1.3882, "step": 275 }, { "epoch": 0.01, "learning_rate": 1.385542168674699e-06, "loss": 1.2175, "step": 276 }, { "epoch": 0.01, "learning_rate": 1.390562248995984e-06, "loss": 1.2643, "step": 277 }, { "epoch": 0.01, "learning_rate": 1.395582329317269e-06, "loss": 1.1188, "step": 278 }, { "epoch": 0.01, "learning_rate": 1.4006024096385544e-06, "loss": 1.1735, "step": 279 }, { "epoch": 0.01, "learning_rate": 1.4056224899598394e-06, "loss": 1.2126, "step": 280 }, { "epoch": 0.01, "learning_rate": 1.4106425702811247e-06, "loss": 1.1843, "step": 281 }, { "epoch": 0.01, "learning_rate": 1.41566265060241e-06, "loss": 1.1759, "step": 282 }, { "epoch": 0.01, "learning_rate": 1.4206827309236948e-06, "loss": 1.2499, "step": 283 }, { "epoch": 0.01, "learning_rate": 1.42570281124498e-06, "loss": 1.2172, "step": 284 }, { "epoch": 0.01, "learning_rate": 1.4307228915662653e-06, "loss": 1.1891, "step": 285 }, { "epoch": 0.01, "learning_rate": 1.4357429718875503e-06, "loss": 1.2121, "step": 286 }, { "epoch": 0.01, "learning_rate": 1.4407630522088354e-06, "loss": 1.2007, "step": 287 }, { "epoch": 0.01, "learning_rate": 1.4457831325301204e-06, "loss": 1.3286, "step": 288 }, { "epoch": 0.01, "learning_rate": 1.4508032128514057e-06, "loss": 1.1889, "step": 289 }, { "epoch": 0.01, "learning_rate": 1.455823293172691e-06, "loss": 1.1826, "step": 290 }, { "epoch": 0.01, "learning_rate": 1.4608433734939762e-06, "loss": 1.2377, "step": 291 }, { "epoch": 0.01, "learning_rate": 1.465863453815261e-06, "loss": 1.1615, "step": 292 }, { "epoch": 0.01, "learning_rate": 1.4708835341365463e-06, "loss": 1.1628, "step": 293 }, { "epoch": 0.01, "learning_rate": 1.4759036144578314e-06, "loss": 1.2023, "step": 294 }, { "epoch": 0.01, "learning_rate": 1.4809236947791166e-06, "loss": 1.2427, "step": 295 }, { "epoch": 0.01, "learning_rate": 1.4859437751004017e-06, "loss": 1.3179, "step": 296 }, { "epoch": 0.01, "learning_rate": 1.4909638554216867e-06, "loss": 1.2139, "step": 297 }, { "epoch": 0.01, "learning_rate": 1.495983935742972e-06, "loss": 1.163, "step": 298 }, { "epoch": 0.01, "learning_rate": 1.5010040160642573e-06, "loss": 1.2454, "step": 299 }, { "epoch": 0.01, "learning_rate": 1.5060240963855425e-06, "loss": 1.2241, "step": 300 }, { "epoch": 0.01, "learning_rate": 1.5110441767068274e-06, "loss": 1.1454, "step": 301 }, { "epoch": 0.01, "learning_rate": 1.5160642570281126e-06, "loss": 1.0392, "step": 302 }, { "epoch": 0.01, "learning_rate": 1.5210843373493977e-06, "loss": 1.1556, "step": 303 }, { "epoch": 0.01, "learning_rate": 1.526104417670683e-06, "loss": 1.1982, "step": 304 }, { "epoch": 0.01, "learning_rate": 1.531124497991968e-06, "loss": 1.1326, "step": 305 }, { "epoch": 0.01, "learning_rate": 1.536144578313253e-06, "loss": 1.2527, "step": 306 }, { "epoch": 0.01, "learning_rate": 1.5411646586345383e-06, "loss": 1.2538, "step": 307 }, { "epoch": 0.01, "learning_rate": 1.5461847389558236e-06, "loss": 1.2006, "step": 308 }, { "epoch": 0.01, "learning_rate": 1.5512048192771086e-06, "loss": 1.1517, "step": 309 }, { "epoch": 0.01, "learning_rate": 1.5562248995983937e-06, "loss": 1.2192, "step": 310 }, { "epoch": 0.01, "learning_rate": 1.561244979919679e-06, "loss": 1.2582, "step": 311 }, { "epoch": 0.01, "learning_rate": 1.566265060240964e-06, "loss": 1.3518, "step": 312 }, { "epoch": 0.01, "learning_rate": 1.5712851405622492e-06, "loss": 1.2488, "step": 313 }, { "epoch": 0.01, "learning_rate": 1.576305220883534e-06, "loss": 1.1938, "step": 314 }, { "epoch": 0.01, "learning_rate": 1.5813253012048193e-06, "loss": 1.09, "step": 315 }, { "epoch": 0.01, "learning_rate": 1.5863453815261046e-06, "loss": 1.3279, "step": 316 }, { "epoch": 0.01, "learning_rate": 1.5913654618473899e-06, "loss": 1.2167, "step": 317 }, { "epoch": 0.01, "learning_rate": 1.5963855421686747e-06, "loss": 1.2066, "step": 318 }, { "epoch": 0.01, "learning_rate": 1.60140562248996e-06, "loss": 1.1867, "step": 319 }, { "epoch": 0.01, "learning_rate": 1.606425702811245e-06, "loss": 1.2032, "step": 320 }, { "epoch": 0.01, "learning_rate": 1.6114457831325303e-06, "loss": 1.2404, "step": 321 }, { "epoch": 0.01, "learning_rate": 1.6164658634538155e-06, "loss": 1.2045, "step": 322 }, { "epoch": 0.01, "learning_rate": 1.6214859437751004e-06, "loss": 1.1906, "step": 323 }, { "epoch": 0.01, "learning_rate": 1.6265060240963856e-06, "loss": 1.1741, "step": 324 }, { "epoch": 0.01, "learning_rate": 1.6315261044176709e-06, "loss": 1.1714, "step": 325 }, { "epoch": 0.01, "learning_rate": 1.6365461847389562e-06, "loss": 1.185, "step": 326 }, { "epoch": 0.01, "learning_rate": 1.641566265060241e-06, "loss": 1.1835, "step": 327 }, { "epoch": 0.01, "learning_rate": 1.6465863453815263e-06, "loss": 1.1339, "step": 328 }, { "epoch": 0.01, "learning_rate": 1.6516064257028113e-06, "loss": 1.1839, "step": 329 }, { "epoch": 0.01, "learning_rate": 1.6566265060240966e-06, "loss": 1.1918, "step": 330 }, { "epoch": 0.01, "learning_rate": 1.6616465863453818e-06, "loss": 1.2167, "step": 331 }, { "epoch": 0.01, "learning_rate": 1.6666666666666667e-06, "loss": 1.1165, "step": 332 }, { "epoch": 0.01, "learning_rate": 1.671686746987952e-06, "loss": 1.131, "step": 333 }, { "epoch": 0.01, "learning_rate": 1.6767068273092372e-06, "loss": 1.2279, "step": 334 }, { "epoch": 0.01, "learning_rate": 1.6817269076305222e-06, "loss": 1.0715, "step": 335 }, { "epoch": 0.01, "learning_rate": 1.6867469879518073e-06, "loss": 1.2137, "step": 336 }, { "epoch": 0.01, "learning_rate": 1.6917670682730925e-06, "loss": 1.291, "step": 337 }, { "epoch": 0.01, "learning_rate": 1.6967871485943776e-06, "loss": 1.1602, "step": 338 }, { "epoch": 0.01, "learning_rate": 1.7018072289156629e-06, "loss": 1.2395, "step": 339 }, { "epoch": 0.01, "learning_rate": 1.7068273092369481e-06, "loss": 1.1719, "step": 340 }, { "epoch": 0.01, "learning_rate": 1.711847389558233e-06, "loss": 1.2139, "step": 341 }, { "epoch": 0.01, "learning_rate": 1.7168674698795182e-06, "loss": 1.1998, "step": 342 }, { "epoch": 0.01, "learning_rate": 1.7218875502008035e-06, "loss": 1.2675, "step": 343 }, { "epoch": 0.01, "learning_rate": 1.7269076305220885e-06, "loss": 1.2324, "step": 344 }, { "epoch": 0.01, "learning_rate": 1.7319277108433736e-06, "loss": 1.2469, "step": 345 }, { "epoch": 0.01, "learning_rate": 1.7369477911646586e-06, "loss": 1.1636, "step": 346 }, { "epoch": 0.01, "learning_rate": 1.7419678714859439e-06, "loss": 1.1909, "step": 347 }, { "epoch": 0.01, "learning_rate": 1.7469879518072292e-06, "loss": 1.2151, "step": 348 }, { "epoch": 0.01, "learning_rate": 1.7520080321285144e-06, "loss": 1.1005, "step": 349 }, { "epoch": 0.01, "learning_rate": 1.7570281124497993e-06, "loss": 1.2531, "step": 350 }, { "epoch": 0.01, "learning_rate": 1.7620481927710845e-06, "loss": 1.1937, "step": 351 }, { "epoch": 0.01, "learning_rate": 1.7670682730923696e-06, "loss": 1.0992, "step": 352 }, { "epoch": 0.01, "learning_rate": 1.7720883534136548e-06, "loss": 1.1724, "step": 353 }, { "epoch": 0.01, "learning_rate": 1.7771084337349399e-06, "loss": 1.2111, "step": 354 }, { "epoch": 0.01, "learning_rate": 1.782128514056225e-06, "loss": 1.2114, "step": 355 }, { "epoch": 0.01, "learning_rate": 1.7871485943775102e-06, "loss": 1.2166, "step": 356 }, { "epoch": 0.01, "learning_rate": 1.7921686746987955e-06, "loss": 1.3374, "step": 357 }, { "epoch": 0.01, "learning_rate": 1.7971887550200803e-06, "loss": 1.2357, "step": 358 }, { "epoch": 0.01, "learning_rate": 1.8022088353413656e-06, "loss": 1.1055, "step": 359 }, { "epoch": 0.01, "learning_rate": 1.8072289156626508e-06, "loss": 1.2325, "step": 360 }, { "epoch": 0.01, "learning_rate": 1.8122489959839359e-06, "loss": 1.2216, "step": 361 }, { "epoch": 0.01, "learning_rate": 1.8172690763052211e-06, "loss": 1.3123, "step": 362 }, { "epoch": 0.01, "learning_rate": 1.8222891566265062e-06, "loss": 1.118, "step": 363 }, { "epoch": 0.01, "learning_rate": 1.8273092369477912e-06, "loss": 1.2112, "step": 364 }, { "epoch": 0.01, "learning_rate": 1.8323293172690765e-06, "loss": 1.1956, "step": 365 }, { "epoch": 0.01, "learning_rate": 1.8373493975903617e-06, "loss": 1.2161, "step": 366 }, { "epoch": 0.01, "learning_rate": 1.8423694779116466e-06, "loss": 1.1689, "step": 367 }, { "epoch": 0.01, "learning_rate": 1.8473895582329318e-06, "loss": 1.1291, "step": 368 }, { "epoch": 0.01, "learning_rate": 1.8524096385542171e-06, "loss": 1.0608, "step": 369 }, { "epoch": 0.01, "learning_rate": 1.8574297188755022e-06, "loss": 1.1381, "step": 370 }, { "epoch": 0.01, "learning_rate": 1.8624497991967874e-06, "loss": 1.0233, "step": 371 }, { "epoch": 0.01, "learning_rate": 1.8674698795180723e-06, "loss": 1.2103, "step": 372 }, { "epoch": 0.01, "learning_rate": 1.8724899598393575e-06, "loss": 1.0747, "step": 373 }, { "epoch": 0.01, "learning_rate": 1.8775100401606428e-06, "loss": 1.3341, "step": 374 }, { "epoch": 0.01, "learning_rate": 1.882530120481928e-06, "loss": 1.105, "step": 375 }, { "epoch": 0.01, "learning_rate": 1.8875502008032129e-06, "loss": 1.1721, "step": 376 }, { "epoch": 0.01, "learning_rate": 1.8925702811244981e-06, "loss": 1.2074, "step": 377 }, { "epoch": 0.01, "learning_rate": 1.8975903614457832e-06, "loss": 1.1992, "step": 378 }, { "epoch": 0.01, "learning_rate": 1.9026104417670685e-06, "loss": 1.3135, "step": 379 }, { "epoch": 0.01, "learning_rate": 1.9076305220883537e-06, "loss": 1.2535, "step": 380 }, { "epoch": 0.01, "learning_rate": 1.9126506024096388e-06, "loss": 1.1398, "step": 381 }, { "epoch": 0.01, "learning_rate": 1.917670682730924e-06, "loss": 1.2048, "step": 382 }, { "epoch": 0.01, "learning_rate": 1.922690763052209e-06, "loss": 1.2257, "step": 383 }, { "epoch": 0.01, "learning_rate": 1.9277108433734943e-06, "loss": 1.1011, "step": 384 }, { "epoch": 0.01, "learning_rate": 1.932730923694779e-06, "loss": 1.2583, "step": 385 }, { "epoch": 0.01, "learning_rate": 1.9377510040160644e-06, "loss": 1.1926, "step": 386 }, { "epoch": 0.01, "learning_rate": 1.9427710843373495e-06, "loss": 1.1757, "step": 387 }, { "epoch": 0.01, "learning_rate": 1.947791164658635e-06, "loss": 1.2224, "step": 388 }, { "epoch": 0.01, "learning_rate": 1.95281124497992e-06, "loss": 1.1533, "step": 389 }, { "epoch": 0.01, "learning_rate": 1.957831325301205e-06, "loss": 1.2163, "step": 390 }, { "epoch": 0.01, "learning_rate": 1.96285140562249e-06, "loss": 1.2047, "step": 391 }, { "epoch": 0.01, "learning_rate": 1.967871485943775e-06, "loss": 1.1746, "step": 392 }, { "epoch": 0.01, "learning_rate": 1.9728915662650606e-06, "loss": 1.1678, "step": 393 }, { "epoch": 0.01, "learning_rate": 1.9779116465863453e-06, "loss": 1.1834, "step": 394 }, { "epoch": 0.01, "learning_rate": 1.9829317269076307e-06, "loss": 1.2194, "step": 395 }, { "epoch": 0.01, "learning_rate": 1.987951807228916e-06, "loss": 1.1625, "step": 396 }, { "epoch": 0.01, "learning_rate": 1.992971887550201e-06, "loss": 1.1104, "step": 397 }, { "epoch": 0.01, "learning_rate": 1.997991967871486e-06, "loss": 1.1923, "step": 398 }, { "epoch": 0.01, "learning_rate": 2.0030120481927714e-06, "loss": 1.2935, "step": 399 }, { "epoch": 0.01, "learning_rate": 2.0080321285140564e-06, "loss": 1.1905, "step": 400 }, { "epoch": 0.01, "learning_rate": 2.0130522088353415e-06, "loss": 1.2489, "step": 401 }, { "epoch": 0.01, "learning_rate": 2.018072289156627e-06, "loss": 1.2571, "step": 402 }, { "epoch": 0.01, "learning_rate": 2.0230923694779116e-06, "loss": 0.9643, "step": 403 }, { "epoch": 0.01, "learning_rate": 2.028112449799197e-06, "loss": 1.1662, "step": 404 }, { "epoch": 0.01, "learning_rate": 2.033132530120482e-06, "loss": 1.2767, "step": 405 }, { "epoch": 0.01, "learning_rate": 2.038152610441767e-06, "loss": 1.1814, "step": 406 }, { "epoch": 0.01, "learning_rate": 2.043172690763052e-06, "loss": 1.2408, "step": 407 }, { "epoch": 0.01, "learning_rate": 2.0481927710843377e-06, "loss": 1.1976, "step": 408 }, { "epoch": 0.01, "learning_rate": 2.0532128514056227e-06, "loss": 1.1796, "step": 409 }, { "epoch": 0.01, "learning_rate": 2.0582329317269078e-06, "loss": 1.1853, "step": 410 }, { "epoch": 0.01, "learning_rate": 2.0632530120481932e-06, "loss": 1.215, "step": 411 }, { "epoch": 0.01, "learning_rate": 2.068273092369478e-06, "loss": 1.1127, "step": 412 }, { "epoch": 0.01, "learning_rate": 2.0732931726907633e-06, "loss": 1.1558, "step": 413 }, { "epoch": 0.01, "learning_rate": 2.0783132530120484e-06, "loss": 1.1968, "step": 414 }, { "epoch": 0.01, "learning_rate": 2.0833333333333334e-06, "loss": 1.2405, "step": 415 }, { "epoch": 0.01, "learning_rate": 2.0883534136546185e-06, "loss": 1.1862, "step": 416 }, { "epoch": 0.01, "learning_rate": 2.0933734939759035e-06, "loss": 1.25, "step": 417 }, { "epoch": 0.01, "learning_rate": 2.098393574297189e-06, "loss": 1.1277, "step": 418 }, { "epoch": 0.01, "learning_rate": 2.103413654618474e-06, "loss": 1.192, "step": 419 }, { "epoch": 0.01, "learning_rate": 2.1084337349397595e-06, "loss": 1.2454, "step": 420 }, { "epoch": 0.01, "learning_rate": 2.113453815261044e-06, "loss": 1.1712, "step": 421 }, { "epoch": 0.01, "learning_rate": 2.1184738955823296e-06, "loss": 1.2356, "step": 422 }, { "epoch": 0.01, "learning_rate": 2.1234939759036147e-06, "loss": 1.1858, "step": 423 }, { "epoch": 0.01, "learning_rate": 2.1285140562248997e-06, "loss": 1.1556, "step": 424 }, { "epoch": 0.01, "learning_rate": 2.1335341365461848e-06, "loss": 1.3066, "step": 425 }, { "epoch": 0.01, "learning_rate": 2.13855421686747e-06, "loss": 1.1935, "step": 426 }, { "epoch": 0.01, "learning_rate": 2.1435742971887553e-06, "loss": 1.0922, "step": 427 }, { "epoch": 0.01, "learning_rate": 2.1485943775100404e-06, "loss": 1.0898, "step": 428 }, { "epoch": 0.01, "learning_rate": 2.1536144578313254e-06, "loss": 1.1514, "step": 429 }, { "epoch": 0.01, "learning_rate": 2.1586345381526105e-06, "loss": 1.3051, "step": 430 }, { "epoch": 0.01, "learning_rate": 2.163654618473896e-06, "loss": 1.2433, "step": 431 }, { "epoch": 0.01, "learning_rate": 2.168674698795181e-06, "loss": 1.1556, "step": 432 }, { "epoch": 0.01, "learning_rate": 2.173694779116466e-06, "loss": 1.1682, "step": 433 }, { "epoch": 0.01, "learning_rate": 2.178714859437751e-06, "loss": 1.2976, "step": 434 }, { "epoch": 0.01, "learning_rate": 2.183734939759036e-06, "loss": 1.1681, "step": 435 }, { "epoch": 0.01, "learning_rate": 2.1887550200803216e-06, "loss": 1.1198, "step": 436 }, { "epoch": 0.01, "learning_rate": 2.1937751004016067e-06, "loss": 1.3199, "step": 437 }, { "epoch": 0.01, "learning_rate": 2.1987951807228917e-06, "loss": 1.2086, "step": 438 }, { "epoch": 0.01, "learning_rate": 2.2038152610441768e-06, "loss": 1.1592, "step": 439 }, { "epoch": 0.01, "learning_rate": 2.2088353413654622e-06, "loss": 1.1182, "step": 440 }, { "epoch": 0.01, "learning_rate": 2.2138554216867473e-06, "loss": 1.1688, "step": 441 }, { "epoch": 0.01, "learning_rate": 2.2188755020080323e-06, "loss": 1.1967, "step": 442 }, { "epoch": 0.01, "learning_rate": 2.2238955823293174e-06, "loss": 1.1482, "step": 443 }, { "epoch": 0.01, "learning_rate": 2.2289156626506024e-06, "loss": 1.1002, "step": 444 }, { "epoch": 0.01, "learning_rate": 2.233935742971888e-06, "loss": 1.146, "step": 445 }, { "epoch": 0.01, "learning_rate": 2.238955823293173e-06, "loss": 1.204, "step": 446 }, { "epoch": 0.01, "learning_rate": 2.243975903614458e-06, "loss": 1.0905, "step": 447 }, { "epoch": 0.01, "learning_rate": 2.248995983935743e-06, "loss": 1.2334, "step": 448 }, { "epoch": 0.01, "learning_rate": 2.254016064257028e-06, "loss": 1.0965, "step": 449 }, { "epoch": 0.01, "learning_rate": 2.2590361445783136e-06, "loss": 1.2169, "step": 450 }, { "epoch": 0.01, "learning_rate": 2.2640562248995986e-06, "loss": 1.1136, "step": 451 }, { "epoch": 0.01, "learning_rate": 2.2690763052208837e-06, "loss": 1.1423, "step": 452 }, { "epoch": 0.01, "learning_rate": 2.2740963855421687e-06, "loss": 1.2517, "step": 453 }, { "epoch": 0.01, "learning_rate": 2.279116465863454e-06, "loss": 1.2709, "step": 454 }, { "epoch": 0.01, "learning_rate": 2.2841365461847392e-06, "loss": 1.1757, "step": 455 }, { "epoch": 0.01, "learning_rate": 2.2891566265060243e-06, "loss": 1.1052, "step": 456 }, { "epoch": 0.01, "learning_rate": 2.2941767068273093e-06, "loss": 1.1669, "step": 457 }, { "epoch": 0.01, "learning_rate": 2.2991967871485944e-06, "loss": 1.1641, "step": 458 }, { "epoch": 0.01, "learning_rate": 2.30421686746988e-06, "loss": 1.1581, "step": 459 }, { "epoch": 0.01, "learning_rate": 2.309236947791165e-06, "loss": 1.1927, "step": 460 }, { "epoch": 0.01, "learning_rate": 2.31425702811245e-06, "loss": 1.2747, "step": 461 }, { "epoch": 0.01, "learning_rate": 2.319277108433735e-06, "loss": 1.1104, "step": 462 }, { "epoch": 0.01, "learning_rate": 2.3242971887550205e-06, "loss": 1.1898, "step": 463 }, { "epoch": 0.01, "learning_rate": 2.3293172690763055e-06, "loss": 1.2172, "step": 464 }, { "epoch": 0.01, "learning_rate": 2.3343373493975906e-06, "loss": 1.212, "step": 465 }, { "epoch": 0.01, "learning_rate": 2.3393574297188756e-06, "loss": 1.1635, "step": 466 }, { "epoch": 0.01, "learning_rate": 2.3443775100401607e-06, "loss": 1.1473, "step": 467 }, { "epoch": 0.01, "learning_rate": 2.349397590361446e-06, "loss": 1.2173, "step": 468 }, { "epoch": 0.01, "learning_rate": 2.3544176706827312e-06, "loss": 1.0703, "step": 469 }, { "epoch": 0.01, "learning_rate": 2.3594377510040163e-06, "loss": 1.1794, "step": 470 }, { "epoch": 0.01, "learning_rate": 2.3644578313253013e-06, "loss": 1.1543, "step": 471 }, { "epoch": 0.01, "learning_rate": 2.3694779116465868e-06, "loss": 1.0568, "step": 472 }, { "epoch": 0.01, "learning_rate": 2.374497991967872e-06, "loss": 1.2534, "step": 473 }, { "epoch": 0.01, "learning_rate": 2.379518072289157e-06, "loss": 1.2385, "step": 474 }, { "epoch": 0.01, "learning_rate": 2.384538152610442e-06, "loss": 1.1198, "step": 475 }, { "epoch": 0.01, "learning_rate": 2.389558232931727e-06, "loss": 1.1227, "step": 476 }, { "epoch": 0.01, "learning_rate": 2.3945783132530125e-06, "loss": 1.213, "step": 477 }, { "epoch": 0.01, "learning_rate": 2.399598393574297e-06, "loss": 1.1208, "step": 478 }, { "epoch": 0.01, "learning_rate": 2.4046184738955826e-06, "loss": 1.2943, "step": 479 }, { "epoch": 0.01, "learning_rate": 2.4096385542168676e-06, "loss": 1.1614, "step": 480 }, { "epoch": 0.01, "learning_rate": 2.4146586345381527e-06, "loss": 1.2052, "step": 481 }, { "epoch": 0.01, "learning_rate": 2.419678714859438e-06, "loss": 1.0342, "step": 482 }, { "epoch": 0.01, "learning_rate": 2.424698795180723e-06, "loss": 1.1041, "step": 483 }, { "epoch": 0.01, "learning_rate": 2.4297188755020082e-06, "loss": 1.2192, "step": 484 }, { "epoch": 0.01, "learning_rate": 2.4347389558232933e-06, "loss": 1.17, "step": 485 }, { "epoch": 0.01, "learning_rate": 2.4397590361445788e-06, "loss": 1.1792, "step": 486 }, { "epoch": 0.01, "learning_rate": 2.4447791164658634e-06, "loss": 1.2184, "step": 487 }, { "epoch": 0.01, "learning_rate": 2.449799196787149e-06, "loss": 1.0862, "step": 488 }, { "epoch": 0.01, "learning_rate": 2.454819277108434e-06, "loss": 1.1874, "step": 489 }, { "epoch": 0.01, "learning_rate": 2.459839357429719e-06, "loss": 1.1653, "step": 490 }, { "epoch": 0.01, "learning_rate": 2.4648594377510044e-06, "loss": 1.1931, "step": 491 }, { "epoch": 0.01, "learning_rate": 2.469879518072289e-06, "loss": 1.2485, "step": 492 }, { "epoch": 0.01, "learning_rate": 2.4748995983935745e-06, "loss": 1.2372, "step": 493 }, { "epoch": 0.01, "learning_rate": 2.4799196787148596e-06, "loss": 1.2213, "step": 494 }, { "epoch": 0.01, "learning_rate": 2.484939759036145e-06, "loss": 1.1373, "step": 495 }, { "epoch": 0.01, "learning_rate": 2.4899598393574297e-06, "loss": 1.1546, "step": 496 }, { "epoch": 0.01, "learning_rate": 2.494979919678715e-06, "loss": 1.001, "step": 497 }, { "epoch": 0.02, "learning_rate": 2.5e-06, "loss": 1.1764, "step": 498 }, { "epoch": 0.02, "learning_rate": 2.5050200803212853e-06, "loss": 1.2568, "step": 499 }, { "epoch": 0.02, "learning_rate": 2.5100401606425707e-06, "loss": 1.3071, "step": 500 }, { "epoch": 0.02, "learning_rate": 2.5150602409638558e-06, "loss": 1.1647, "step": 501 }, { "epoch": 0.02, "learning_rate": 2.520080321285141e-06, "loss": 1.1989, "step": 502 }, { "epoch": 0.02, "learning_rate": 2.525100401606426e-06, "loss": 1.1036, "step": 503 }, { "epoch": 0.02, "learning_rate": 2.530120481927711e-06, "loss": 1.1436, "step": 504 }, { "epoch": 0.02, "learning_rate": 2.535140562248996e-06, "loss": 1.1364, "step": 505 }, { "epoch": 0.02, "learning_rate": 2.5401606425702815e-06, "loss": 1.2365, "step": 506 }, { "epoch": 0.02, "learning_rate": 2.5451807228915665e-06, "loss": 1.1926, "step": 507 }, { "epoch": 0.02, "learning_rate": 2.5502008032128516e-06, "loss": 1.17, "step": 508 }, { "epoch": 0.02, "learning_rate": 2.555220883534137e-06, "loss": 1.2609, "step": 509 }, { "epoch": 0.02, "learning_rate": 2.560240963855422e-06, "loss": 1.2097, "step": 510 }, { "epoch": 0.02, "learning_rate": 2.565261044176707e-06, "loss": 1.2088, "step": 511 }, { "epoch": 0.02, "learning_rate": 2.5702811244979918e-06, "loss": 1.2088, "step": 512 }, { "epoch": 0.02, "learning_rate": 2.5753012048192772e-06, "loss": 1.2214, "step": 513 }, { "epoch": 0.02, "learning_rate": 2.5803212851405623e-06, "loss": 1.1436, "step": 514 }, { "epoch": 0.02, "learning_rate": 2.5853413654618477e-06, "loss": 1.0466, "step": 515 }, { "epoch": 0.02, "learning_rate": 2.590361445783133e-06, "loss": 1.115, "step": 516 }, { "epoch": 0.02, "learning_rate": 2.595381526104418e-06, "loss": 1.1993, "step": 517 }, { "epoch": 0.02, "learning_rate": 2.6004016064257033e-06, "loss": 1.1859, "step": 518 }, { "epoch": 0.02, "learning_rate": 2.6054216867469884e-06, "loss": 1.1805, "step": 519 }, { "epoch": 0.02, "learning_rate": 2.6104417670682734e-06, "loss": 1.205, "step": 520 }, { "epoch": 0.02, "learning_rate": 2.615461847389558e-06, "loss": 1.2191, "step": 521 }, { "epoch": 0.02, "learning_rate": 2.6204819277108435e-06, "loss": 1.0483, "step": 522 }, { "epoch": 0.02, "learning_rate": 2.6255020080321286e-06, "loss": 1.271, "step": 523 }, { "epoch": 0.02, "learning_rate": 2.6305220883534136e-06, "loss": 1.1379, "step": 524 }, { "epoch": 0.02, "learning_rate": 2.635542168674699e-06, "loss": 1.2911, "step": 525 }, { "epoch": 0.02, "learning_rate": 2.640562248995984e-06, "loss": 1.1744, "step": 526 }, { "epoch": 0.02, "learning_rate": 2.6455823293172696e-06, "loss": 1.0969, "step": 527 }, { "epoch": 0.02, "learning_rate": 2.6506024096385547e-06, "loss": 1.2247, "step": 528 }, { "epoch": 0.02, "learning_rate": 2.6556224899598397e-06, "loss": 1.2526, "step": 529 }, { "epoch": 0.02, "learning_rate": 2.6606425702811243e-06, "loss": 1.2623, "step": 530 }, { "epoch": 0.02, "learning_rate": 2.66566265060241e-06, "loss": 1.207, "step": 531 }, { "epoch": 0.02, "learning_rate": 2.670682730923695e-06, "loss": 1.0773, "step": 532 }, { "epoch": 0.02, "learning_rate": 2.67570281124498e-06, "loss": 1.2032, "step": 533 }, { "epoch": 0.02, "learning_rate": 2.6807228915662654e-06, "loss": 1.1102, "step": 534 }, { "epoch": 0.02, "learning_rate": 2.6857429718875504e-06, "loss": 1.237, "step": 535 }, { "epoch": 0.02, "learning_rate": 2.690763052208836e-06, "loss": 1.1904, "step": 536 }, { "epoch": 0.02, "learning_rate": 2.695783132530121e-06, "loss": 1.2063, "step": 537 }, { "epoch": 0.02, "learning_rate": 2.700803212851406e-06, "loss": 1.2887, "step": 538 }, { "epoch": 0.02, "learning_rate": 2.7058232931726906e-06, "loss": 1.1348, "step": 539 }, { "epoch": 0.02, "learning_rate": 2.710843373493976e-06, "loss": 1.166, "step": 540 }, { "epoch": 0.02, "learning_rate": 2.715863453815261e-06, "loss": 1.2218, "step": 541 }, { "epoch": 0.02, "learning_rate": 2.7208835341365462e-06, "loss": 1.2759, "step": 542 }, { "epoch": 0.02, "learning_rate": 2.7259036144578317e-06, "loss": 1.1385, "step": 543 }, { "epoch": 0.02, "learning_rate": 2.7309236947791167e-06, "loss": 1.0538, "step": 544 }, { "epoch": 0.02, "learning_rate": 2.735943775100402e-06, "loss": 1.1441, "step": 545 }, { "epoch": 0.02, "learning_rate": 2.7409638554216873e-06, "loss": 1.2615, "step": 546 }, { "epoch": 0.02, "learning_rate": 2.745983935742972e-06, "loss": 1.192, "step": 547 }, { "epoch": 0.02, "learning_rate": 2.751004016064257e-06, "loss": 1.2115, "step": 548 }, { "epoch": 0.02, "learning_rate": 2.7560240963855424e-06, "loss": 1.1034, "step": 549 }, { "epoch": 0.02, "learning_rate": 2.7610441767068275e-06, "loss": 1.1382, "step": 550 }, { "epoch": 0.02, "learning_rate": 2.7660642570281125e-06, "loss": 1.2318, "step": 551 }, { "epoch": 0.02, "learning_rate": 2.771084337349398e-06, "loss": 1.2134, "step": 552 }, { "epoch": 0.02, "learning_rate": 2.776104417670683e-06, "loss": 1.1697, "step": 553 }, { "epoch": 0.02, "learning_rate": 2.781124497991968e-06, "loss": 1.1258, "step": 554 }, { "epoch": 0.02, "learning_rate": 2.7861445783132536e-06, "loss": 1.1729, "step": 555 }, { "epoch": 0.02, "learning_rate": 2.791164658634538e-06, "loss": 1.2006, "step": 556 }, { "epoch": 0.02, "learning_rate": 2.7961847389558232e-06, "loss": 1.2927, "step": 557 }, { "epoch": 0.02, "learning_rate": 2.8012048192771087e-06, "loss": 1.2198, "step": 558 }, { "epoch": 0.02, "learning_rate": 2.8062248995983938e-06, "loss": 1.187, "step": 559 }, { "epoch": 0.02, "learning_rate": 2.811244979919679e-06, "loss": 1.2356, "step": 560 }, { "epoch": 0.02, "learning_rate": 2.8162650602409643e-06, "loss": 1.2475, "step": 561 }, { "epoch": 0.02, "learning_rate": 2.8212851405622493e-06, "loss": 1.212, "step": 562 }, { "epoch": 0.02, "learning_rate": 2.8263052208835344e-06, "loss": 1.2125, "step": 563 }, { "epoch": 0.02, "learning_rate": 2.83132530120482e-06, "loss": 1.2113, "step": 564 }, { "epoch": 0.02, "learning_rate": 2.8363453815261045e-06, "loss": 1.1117, "step": 565 }, { "epoch": 0.02, "learning_rate": 2.8413654618473895e-06, "loss": 1.1824, "step": 566 }, { "epoch": 0.02, "learning_rate": 2.846385542168675e-06, "loss": 1.1953, "step": 567 }, { "epoch": 0.02, "learning_rate": 2.85140562248996e-06, "loss": 1.1313, "step": 568 }, { "epoch": 0.02, "learning_rate": 2.856425702811245e-06, "loss": 1.2103, "step": 569 }, { "epoch": 0.02, "learning_rate": 2.8614457831325306e-06, "loss": 1.2441, "step": 570 }, { "epoch": 0.02, "learning_rate": 2.8664658634538156e-06, "loss": 1.1554, "step": 571 }, { "epoch": 0.02, "learning_rate": 2.8714859437751007e-06, "loss": 1.0688, "step": 572 }, { "epoch": 0.02, "learning_rate": 2.876506024096386e-06, "loss": 1.1511, "step": 573 }, { "epoch": 0.02, "learning_rate": 2.8815261044176708e-06, "loss": 1.3375, "step": 574 }, { "epoch": 0.02, "learning_rate": 2.886546184738956e-06, "loss": 1.3309, "step": 575 }, { "epoch": 0.02, "learning_rate": 2.891566265060241e-06, "loss": 1.2534, "step": 576 }, { "epoch": 0.02, "learning_rate": 2.8965863453815264e-06, "loss": 1.1337, "step": 577 }, { "epoch": 0.02, "learning_rate": 2.9016064257028114e-06, "loss": 1.1599, "step": 578 }, { "epoch": 0.02, "learning_rate": 2.906626506024097e-06, "loss": 1.1726, "step": 579 }, { "epoch": 0.02, "learning_rate": 2.911646586345382e-06, "loss": 1.2249, "step": 580 }, { "epoch": 0.02, "learning_rate": 2.916666666666667e-06, "loss": 1.2438, "step": 581 }, { "epoch": 0.02, "learning_rate": 2.9216867469879524e-06, "loss": 1.2019, "step": 582 }, { "epoch": 0.02, "learning_rate": 2.926706827309237e-06, "loss": 1.2097, "step": 583 }, { "epoch": 0.02, "learning_rate": 2.931726907630522e-06, "loss": 1.1197, "step": 584 }, { "epoch": 0.02, "learning_rate": 2.936746987951807e-06, "loss": 1.2189, "step": 585 }, { "epoch": 0.02, "learning_rate": 2.9417670682730926e-06, "loss": 1.2117, "step": 586 }, { "epoch": 0.02, "learning_rate": 2.9467871485943777e-06, "loss": 1.2493, "step": 587 }, { "epoch": 0.02, "learning_rate": 2.9518072289156627e-06, "loss": 1.2043, "step": 588 }, { "epoch": 0.02, "learning_rate": 2.9568273092369482e-06, "loss": 1.178, "step": 589 }, { "epoch": 0.02, "learning_rate": 2.9618473895582333e-06, "loss": 1.1683, "step": 590 }, { "epoch": 0.02, "learning_rate": 2.9668674698795187e-06, "loss": 1.1815, "step": 591 }, { "epoch": 0.02, "learning_rate": 2.9718875502008034e-06, "loss": 1.1632, "step": 592 }, { "epoch": 0.02, "learning_rate": 2.9769076305220884e-06, "loss": 1.2046, "step": 593 }, { "epoch": 0.02, "learning_rate": 2.9819277108433735e-06, "loss": 1.1616, "step": 594 }, { "epoch": 0.02, "learning_rate": 2.986947791164659e-06, "loss": 1.2184, "step": 595 }, { "epoch": 0.02, "learning_rate": 2.991967871485944e-06, "loss": 1.1403, "step": 596 }, { "epoch": 0.02, "learning_rate": 2.996987951807229e-06, "loss": 1.1066, "step": 597 }, { "epoch": 0.02, "learning_rate": 3.0020080321285145e-06, "loss": 1.3006, "step": 598 }, { "epoch": 0.02, "learning_rate": 3.0070281124497996e-06, "loss": 1.1857, "step": 599 }, { "epoch": 0.02, "learning_rate": 3.012048192771085e-06, "loss": 1.1275, "step": 600 }, { "epoch": 0.02, "learning_rate": 3.0170682730923697e-06, "loss": 1.1747, "step": 601 }, { "epoch": 0.02, "learning_rate": 3.0220883534136547e-06, "loss": 1.2317, "step": 602 }, { "epoch": 0.02, "learning_rate": 3.0271084337349398e-06, "loss": 1.0913, "step": 603 }, { "epoch": 0.02, "learning_rate": 3.0321285140562252e-06, "loss": 1.1472, "step": 604 }, { "epoch": 0.02, "learning_rate": 3.0371485943775103e-06, "loss": 1.181, "step": 605 }, { "epoch": 0.02, "learning_rate": 3.0421686746987953e-06, "loss": 1.1639, "step": 606 }, { "epoch": 0.02, "learning_rate": 3.047188755020081e-06, "loss": 1.0945, "step": 607 }, { "epoch": 0.02, "learning_rate": 3.052208835341366e-06, "loss": 1.2145, "step": 608 }, { "epoch": 0.02, "learning_rate": 3.057228915662651e-06, "loss": 1.0829, "step": 609 }, { "epoch": 0.02, "learning_rate": 3.062248995983936e-06, "loss": 1.1107, "step": 610 }, { "epoch": 0.02, "learning_rate": 3.067269076305221e-06, "loss": 1.1605, "step": 611 }, { "epoch": 0.02, "learning_rate": 3.072289156626506e-06, "loss": 1.1741, "step": 612 }, { "epoch": 0.02, "learning_rate": 3.0773092369477915e-06, "loss": 1.1684, "step": 613 }, { "epoch": 0.02, "learning_rate": 3.0823293172690766e-06, "loss": 1.1579, "step": 614 }, { "epoch": 0.02, "learning_rate": 3.0873493975903616e-06, "loss": 1.2404, "step": 615 }, { "epoch": 0.02, "learning_rate": 3.092369477911647e-06, "loss": 1.1518, "step": 616 }, { "epoch": 0.02, "learning_rate": 3.097389558232932e-06, "loss": 1.1941, "step": 617 }, { "epoch": 0.02, "learning_rate": 3.1024096385542172e-06, "loss": 1.212, "step": 618 }, { "epoch": 0.02, "learning_rate": 3.107429718875502e-06, "loss": 1.0948, "step": 619 }, { "epoch": 0.02, "learning_rate": 3.1124497991967873e-06, "loss": 1.1985, "step": 620 }, { "epoch": 0.02, "learning_rate": 3.1174698795180724e-06, "loss": 1.0709, "step": 621 }, { "epoch": 0.02, "learning_rate": 3.122489959839358e-06, "loss": 1.1178, "step": 622 }, { "epoch": 0.02, "learning_rate": 3.127510040160643e-06, "loss": 1.2018, "step": 623 }, { "epoch": 0.02, "learning_rate": 3.132530120481928e-06, "loss": 0.9734, "step": 624 }, { "epoch": 0.02, "learning_rate": 3.1375502008032134e-06, "loss": 1.1774, "step": 625 }, { "epoch": 0.02, "learning_rate": 3.1425702811244985e-06, "loss": 1.1783, "step": 626 }, { "epoch": 0.02, "learning_rate": 3.147590361445783e-06, "loss": 1.083, "step": 627 }, { "epoch": 0.02, "learning_rate": 3.152610441767068e-06, "loss": 1.1686, "step": 628 }, { "epoch": 0.02, "learning_rate": 3.1576305220883536e-06, "loss": 1.1891, "step": 629 }, { "epoch": 0.02, "learning_rate": 3.1626506024096387e-06, "loss": 1.2729, "step": 630 }, { "epoch": 0.02, "learning_rate": 3.167670682730924e-06, "loss": 1.1238, "step": 631 }, { "epoch": 0.02, "learning_rate": 3.172690763052209e-06, "loss": 1.1558, "step": 632 }, { "epoch": 0.02, "learning_rate": 3.1777108433734942e-06, "loss": 1.1774, "step": 633 }, { "epoch": 0.02, "learning_rate": 3.1827309236947797e-06, "loss": 1.1907, "step": 634 }, { "epoch": 0.02, "learning_rate": 3.1877510040160648e-06, "loss": 1.1663, "step": 635 }, { "epoch": 0.02, "learning_rate": 3.1927710843373494e-06, "loss": 1.255, "step": 636 }, { "epoch": 0.02, "learning_rate": 3.1977911646586344e-06, "loss": 1.205, "step": 637 }, { "epoch": 0.02, "learning_rate": 3.20281124497992e-06, "loss": 1.202, "step": 638 }, { "epoch": 0.02, "learning_rate": 3.207831325301205e-06, "loss": 1.1733, "step": 639 }, { "epoch": 0.02, "learning_rate": 3.21285140562249e-06, "loss": 1.174, "step": 640 }, { "epoch": 0.02, "learning_rate": 3.2178714859437755e-06, "loss": 1.1836, "step": 641 }, { "epoch": 0.02, "learning_rate": 3.2228915662650605e-06, "loss": 1.1837, "step": 642 }, { "epoch": 0.02, "learning_rate": 3.227911646586346e-06, "loss": 1.1914, "step": 643 }, { "epoch": 0.02, "learning_rate": 3.232931726907631e-06, "loss": 1.1087, "step": 644 }, { "epoch": 0.02, "learning_rate": 3.2379518072289157e-06, "loss": 1.189, "step": 645 }, { "epoch": 0.02, "learning_rate": 3.2429718875502007e-06, "loss": 1.1396, "step": 646 }, { "epoch": 0.02, "learning_rate": 3.247991967871486e-06, "loss": 1.1616, "step": 647 }, { "epoch": 0.02, "learning_rate": 3.2530120481927713e-06, "loss": 1.1066, "step": 648 }, { "epoch": 0.02, "learning_rate": 3.2580321285140563e-06, "loss": 1.0612, "step": 649 }, { "epoch": 0.02, "learning_rate": 3.2630522088353418e-06, "loss": 1.2165, "step": 650 }, { "epoch": 0.02, "learning_rate": 3.268072289156627e-06, "loss": 1.1463, "step": 651 }, { "epoch": 0.02, "learning_rate": 3.2730923694779123e-06, "loss": 1.1987, "step": 652 }, { "epoch": 0.02, "learning_rate": 3.2781124497991974e-06, "loss": 1.1287, "step": 653 }, { "epoch": 0.02, "learning_rate": 3.283132530120482e-06, "loss": 0.945, "step": 654 }, { "epoch": 0.02, "learning_rate": 3.288152610441767e-06, "loss": 1.1806, "step": 655 }, { "epoch": 0.02, "learning_rate": 3.2931726907630525e-06, "loss": 1.161, "step": 656 }, { "epoch": 0.02, "learning_rate": 3.2981927710843376e-06, "loss": 1.0748, "step": 657 }, { "epoch": 0.02, "learning_rate": 3.3032128514056226e-06, "loss": 1.2085, "step": 658 }, { "epoch": 0.02, "learning_rate": 3.308232931726908e-06, "loss": 1.243, "step": 659 }, { "epoch": 0.02, "learning_rate": 3.313253012048193e-06, "loss": 1.0631, "step": 660 }, { "epoch": 0.02, "learning_rate": 3.318273092369478e-06, "loss": 1.2524, "step": 661 }, { "epoch": 0.02, "learning_rate": 3.3232931726907636e-06, "loss": 1.1423, "step": 662 }, { "epoch": 0.02, "learning_rate": 3.3283132530120483e-06, "loss": 1.2026, "step": 663 }, { "epoch": 0.02, "learning_rate": 3.3333333333333333e-06, "loss": 1.124, "step": 664 }, { "epoch": 0.02, "learning_rate": 3.338353413654619e-06, "loss": 1.0865, "step": 665 }, { "epoch": 0.02, "learning_rate": 3.343373493975904e-06, "loss": 1.1572, "step": 666 }, { "epoch": 0.02, "learning_rate": 3.348393574297189e-06, "loss": 1.1689, "step": 667 }, { "epoch": 0.02, "learning_rate": 3.3534136546184744e-06, "loss": 1.3318, "step": 668 }, { "epoch": 0.02, "learning_rate": 3.3584337349397594e-06, "loss": 1.2412, "step": 669 }, { "epoch": 0.02, "learning_rate": 3.3634538152610445e-06, "loss": 1.128, "step": 670 }, { "epoch": 0.02, "learning_rate": 3.36847389558233e-06, "loss": 1.1482, "step": 671 }, { "epoch": 0.02, "learning_rate": 3.3734939759036146e-06, "loss": 1.1898, "step": 672 }, { "epoch": 0.02, "learning_rate": 3.3785140562248996e-06, "loss": 1.2017, "step": 673 }, { "epoch": 0.02, "learning_rate": 3.383534136546185e-06, "loss": 1.1882, "step": 674 }, { "epoch": 0.02, "learning_rate": 3.38855421686747e-06, "loss": 1.1981, "step": 675 }, { "epoch": 0.02, "learning_rate": 3.393574297188755e-06, "loss": 1.1197, "step": 676 }, { "epoch": 0.02, "learning_rate": 3.3985943775100407e-06, "loss": 1.1023, "step": 677 }, { "epoch": 0.02, "learning_rate": 3.4036144578313257e-06, "loss": 1.1816, "step": 678 }, { "epoch": 0.02, "learning_rate": 3.4086345381526108e-06, "loss": 1.1912, "step": 679 }, { "epoch": 0.02, "learning_rate": 3.4136546184738962e-06, "loss": 1.2328, "step": 680 }, { "epoch": 0.02, "learning_rate": 3.418674698795181e-06, "loss": 1.161, "step": 681 }, { "epoch": 0.02, "learning_rate": 3.423694779116466e-06, "loss": 1.231, "step": 682 }, { "epoch": 0.02, "learning_rate": 3.428714859437751e-06, "loss": 1.1907, "step": 683 }, { "epoch": 0.02, "learning_rate": 3.4337349397590364e-06, "loss": 1.1454, "step": 684 }, { "epoch": 0.02, "learning_rate": 3.4387550200803215e-06, "loss": 1.1617, "step": 685 }, { "epoch": 0.02, "learning_rate": 3.443775100401607e-06, "loss": 1.0974, "step": 686 }, { "epoch": 0.02, "learning_rate": 3.448795180722892e-06, "loss": 1.2363, "step": 687 }, { "epoch": 0.02, "learning_rate": 3.453815261044177e-06, "loss": 1.0786, "step": 688 }, { "epoch": 0.02, "learning_rate": 3.4588353413654625e-06, "loss": 1.2175, "step": 689 }, { "epoch": 0.02, "learning_rate": 3.463855421686747e-06, "loss": 1.2083, "step": 690 }, { "epoch": 0.02, "learning_rate": 3.4688755020080322e-06, "loss": 1.2068, "step": 691 }, { "epoch": 0.02, "learning_rate": 3.4738955823293173e-06, "loss": 1.1506, "step": 692 }, { "epoch": 0.02, "learning_rate": 3.4789156626506027e-06, "loss": 1.0679, "step": 693 }, { "epoch": 0.02, "learning_rate": 3.4839357429718878e-06, "loss": 1.2758, "step": 694 }, { "epoch": 0.02, "learning_rate": 3.4889558232931733e-06, "loss": 1.2507, "step": 695 }, { "epoch": 0.02, "learning_rate": 3.4939759036144583e-06, "loss": 1.1918, "step": 696 }, { "epoch": 0.02, "learning_rate": 3.4989959839357434e-06, "loss": 1.1268, "step": 697 }, { "epoch": 0.02, "learning_rate": 3.504016064257029e-06, "loss": 1.2251, "step": 698 }, { "epoch": 0.02, "learning_rate": 3.5090361445783135e-06, "loss": 1.2472, "step": 699 }, { "epoch": 0.02, "learning_rate": 3.5140562248995985e-06, "loss": 1.0486, "step": 700 }, { "epoch": 0.02, "learning_rate": 3.5190763052208836e-06, "loss": 1.1672, "step": 701 }, { "epoch": 0.02, "learning_rate": 3.524096385542169e-06, "loss": 1.2443, "step": 702 }, { "epoch": 0.02, "learning_rate": 3.529116465863454e-06, "loss": 1.2083, "step": 703 }, { "epoch": 0.02, "learning_rate": 3.534136546184739e-06, "loss": 1.1537, "step": 704 }, { "epoch": 0.02, "learning_rate": 3.5391566265060246e-06, "loss": 1.1952, "step": 705 }, { "epoch": 0.02, "learning_rate": 3.5441767068273097e-06, "loss": 1.3051, "step": 706 }, { "epoch": 0.02, "learning_rate": 3.5491967871485943e-06, "loss": 1.1139, "step": 707 }, { "epoch": 0.02, "learning_rate": 3.5542168674698798e-06, "loss": 1.166, "step": 708 }, { "epoch": 0.02, "learning_rate": 3.559236947791165e-06, "loss": 1.0823, "step": 709 }, { "epoch": 0.02, "learning_rate": 3.56425702811245e-06, "loss": 1.1886, "step": 710 }, { "epoch": 0.02, "learning_rate": 3.5692771084337353e-06, "loss": 1.2087, "step": 711 }, { "epoch": 0.02, "learning_rate": 3.5742971887550204e-06, "loss": 1.1559, "step": 712 }, { "epoch": 0.02, "learning_rate": 3.5793172690763054e-06, "loss": 1.1663, "step": 713 }, { "epoch": 0.02, "learning_rate": 3.584337349397591e-06, "loss": 1.2113, "step": 714 }, { "epoch": 0.02, "learning_rate": 3.589357429718876e-06, "loss": 1.1192, "step": 715 }, { "epoch": 0.02, "learning_rate": 3.5943775100401606e-06, "loss": 1.2707, "step": 716 }, { "epoch": 0.02, "learning_rate": 3.599397590361446e-06, "loss": 1.236, "step": 717 }, { "epoch": 0.02, "learning_rate": 3.604417670682731e-06, "loss": 1.2584, "step": 718 }, { "epoch": 0.02, "learning_rate": 3.609437751004016e-06, "loss": 1.1155, "step": 719 }, { "epoch": 0.02, "learning_rate": 3.6144578313253016e-06, "loss": 1.1029, "step": 720 }, { "epoch": 0.02, "learning_rate": 3.6194779116465867e-06, "loss": 1.1742, "step": 721 }, { "epoch": 0.02, "learning_rate": 3.6244979919678717e-06, "loss": 1.12, "step": 722 }, { "epoch": 0.02, "learning_rate": 3.629518072289157e-06, "loss": 1.166, "step": 723 }, { "epoch": 0.02, "learning_rate": 3.6345381526104423e-06, "loss": 1.1995, "step": 724 }, { "epoch": 0.02, "learning_rate": 3.639558232931727e-06, "loss": 1.203, "step": 725 }, { "epoch": 0.02, "learning_rate": 3.6445783132530124e-06, "loss": 1.0984, "step": 726 }, { "epoch": 0.02, "learning_rate": 3.6495983935742974e-06, "loss": 1.271, "step": 727 }, { "epoch": 0.02, "learning_rate": 3.6546184738955825e-06, "loss": 1.1285, "step": 728 }, { "epoch": 0.02, "learning_rate": 3.659638554216868e-06, "loss": 1.1595, "step": 729 }, { "epoch": 0.02, "learning_rate": 3.664658634538153e-06, "loss": 1.0826, "step": 730 }, { "epoch": 0.02, "learning_rate": 3.669678714859438e-06, "loss": 1.1198, "step": 731 }, { "epoch": 0.02, "learning_rate": 3.6746987951807235e-06, "loss": 1.2574, "step": 732 }, { "epoch": 0.02, "learning_rate": 3.6797188755020085e-06, "loss": 1.1336, "step": 733 }, { "epoch": 0.02, "learning_rate": 3.684738955823293e-06, "loss": 1.225, "step": 734 }, { "epoch": 0.02, "learning_rate": 3.6897590361445782e-06, "loss": 1.1661, "step": 735 }, { "epoch": 0.02, "learning_rate": 3.6947791164658637e-06, "loss": 1.2579, "step": 736 }, { "epoch": 0.02, "learning_rate": 3.6997991967871487e-06, "loss": 1.058, "step": 737 }, { "epoch": 0.02, "learning_rate": 3.7048192771084342e-06, "loss": 1.1254, "step": 738 }, { "epoch": 0.02, "learning_rate": 3.7098393574297193e-06, "loss": 1.2144, "step": 739 }, { "epoch": 0.02, "learning_rate": 3.7148594377510043e-06, "loss": 1.1376, "step": 740 }, { "epoch": 0.02, "learning_rate": 3.71987951807229e-06, "loss": 1.1866, "step": 741 }, { "epoch": 0.02, "learning_rate": 3.724899598393575e-06, "loss": 1.1795, "step": 742 }, { "epoch": 0.02, "learning_rate": 3.7299196787148595e-06, "loss": 1.1188, "step": 743 }, { "epoch": 0.02, "learning_rate": 3.7349397590361445e-06, "loss": 1.2007, "step": 744 }, { "epoch": 0.02, "learning_rate": 3.73995983935743e-06, "loss": 1.0975, "step": 745 }, { "epoch": 0.02, "learning_rate": 3.744979919678715e-06, "loss": 1.1866, "step": 746 }, { "epoch": 0.02, "learning_rate": 3.7500000000000005e-06, "loss": 1.1664, "step": 747 }, { "epoch": 0.02, "learning_rate": 3.7550200803212856e-06, "loss": 1.1823, "step": 748 }, { "epoch": 0.02, "learning_rate": 3.7600401606425706e-06, "loss": 1.1309, "step": 749 }, { "epoch": 0.02, "learning_rate": 3.765060240963856e-06, "loss": 1.2036, "step": 750 }, { "epoch": 0.02, "learning_rate": 3.770080321285141e-06, "loss": 1.2324, "step": 751 }, { "epoch": 0.02, "learning_rate": 3.7751004016064258e-06, "loss": 1.1739, "step": 752 }, { "epoch": 0.02, "learning_rate": 3.780120481927711e-06, "loss": 1.0905, "step": 753 }, { "epoch": 0.02, "learning_rate": 3.7851405622489963e-06, "loss": 1.1924, "step": 754 }, { "epoch": 0.02, "learning_rate": 3.7901606425702813e-06, "loss": 1.2185, "step": 755 }, { "epoch": 0.02, "learning_rate": 3.7951807228915664e-06, "loss": 1.1776, "step": 756 }, { "epoch": 0.02, "learning_rate": 3.800200803212852e-06, "loss": 1.1347, "step": 757 }, { "epoch": 0.02, "learning_rate": 3.805220883534137e-06, "loss": 1.1628, "step": 758 }, { "epoch": 0.02, "learning_rate": 3.8102409638554224e-06, "loss": 1.1449, "step": 759 }, { "epoch": 0.02, "learning_rate": 3.8152610441767074e-06, "loss": 1.1294, "step": 760 }, { "epoch": 0.02, "learning_rate": 3.820281124497992e-06, "loss": 1.2632, "step": 761 }, { "epoch": 0.02, "learning_rate": 3.8253012048192775e-06, "loss": 1.2375, "step": 762 }, { "epoch": 0.02, "learning_rate": 3.830321285140562e-06, "loss": 1.2219, "step": 763 }, { "epoch": 0.02, "learning_rate": 3.835341365461848e-06, "loss": 1.1803, "step": 764 }, { "epoch": 0.02, "learning_rate": 3.840361445783133e-06, "loss": 1.11, "step": 765 }, { "epoch": 0.02, "learning_rate": 3.845381526104418e-06, "loss": 1.2098, "step": 766 }, { "epoch": 0.02, "learning_rate": 3.850401606425703e-06, "loss": 1.2538, "step": 767 }, { "epoch": 0.02, "learning_rate": 3.855421686746989e-06, "loss": 1.2141, "step": 768 }, { "epoch": 0.02, "learning_rate": 3.860441767068273e-06, "loss": 1.1812, "step": 769 }, { "epoch": 0.02, "learning_rate": 3.865461847389558e-06, "loss": 1.1094, "step": 770 }, { "epoch": 0.02, "learning_rate": 3.870481927710843e-06, "loss": 1.1046, "step": 771 }, { "epoch": 0.02, "learning_rate": 3.875502008032129e-06, "loss": 1.1547, "step": 772 }, { "epoch": 0.02, "learning_rate": 3.8805220883534135e-06, "loss": 1.2114, "step": 773 }, { "epoch": 0.02, "learning_rate": 3.885542168674699e-06, "loss": 1.229, "step": 774 }, { "epoch": 0.02, "learning_rate": 3.8905622489959845e-06, "loss": 1.026, "step": 775 }, { "epoch": 0.02, "learning_rate": 3.89558232931727e-06, "loss": 1.2162, "step": 776 }, { "epoch": 0.02, "learning_rate": 3.9006024096385546e-06, "loss": 1.1267, "step": 777 }, { "epoch": 0.02, "learning_rate": 3.90562248995984e-06, "loss": 1.2231, "step": 778 }, { "epoch": 0.02, "learning_rate": 3.910642570281125e-06, "loss": 1.1613, "step": 779 }, { "epoch": 0.02, "learning_rate": 3.91566265060241e-06, "loss": 1.1917, "step": 780 }, { "epoch": 0.02, "learning_rate": 3.920682730923695e-06, "loss": 1.3037, "step": 781 }, { "epoch": 0.02, "learning_rate": 3.92570281124498e-06, "loss": 1.1561, "step": 782 }, { "epoch": 0.02, "learning_rate": 3.930722891566266e-06, "loss": 1.1202, "step": 783 }, { "epoch": 0.02, "learning_rate": 3.93574297188755e-06, "loss": 1.2013, "step": 784 }, { "epoch": 0.02, "learning_rate": 3.940763052208836e-06, "loss": 1.3037, "step": 785 }, { "epoch": 0.02, "learning_rate": 3.945783132530121e-06, "loss": 1.2101, "step": 786 }, { "epoch": 0.02, "learning_rate": 3.950803212851406e-06, "loss": 1.1733, "step": 787 }, { "epoch": 0.02, "learning_rate": 3.9558232931726905e-06, "loss": 1.0984, "step": 788 }, { "epoch": 0.02, "learning_rate": 3.960843373493976e-06, "loss": 1.2742, "step": 789 }, { "epoch": 0.02, "learning_rate": 3.9658634538152615e-06, "loss": 1.1224, "step": 790 }, { "epoch": 0.02, "learning_rate": 3.970883534136546e-06, "loss": 1.1318, "step": 791 }, { "epoch": 0.02, "learning_rate": 3.975903614457832e-06, "loss": 1.1938, "step": 792 }, { "epoch": 0.02, "learning_rate": 3.980923694779117e-06, "loss": 1.1208, "step": 793 }, { "epoch": 0.02, "learning_rate": 3.985943775100402e-06, "loss": 1.1153, "step": 794 }, { "epoch": 0.02, "learning_rate": 3.990963855421687e-06, "loss": 1.0952, "step": 795 }, { "epoch": 0.02, "learning_rate": 3.995983935742972e-06, "loss": 1.0912, "step": 796 }, { "epoch": 0.02, "learning_rate": 4.001004016064257e-06, "loss": 1.1032, "step": 797 }, { "epoch": 0.02, "learning_rate": 4.006024096385543e-06, "loss": 1.204, "step": 798 }, { "epoch": 0.02, "learning_rate": 4.011044176706827e-06, "loss": 1.2959, "step": 799 }, { "epoch": 0.02, "learning_rate": 4.016064257028113e-06, "loss": 1.1191, "step": 800 }, { "epoch": 0.02, "learning_rate": 4.021084337349398e-06, "loss": 1.2489, "step": 801 }, { "epoch": 0.02, "learning_rate": 4.026104417670683e-06, "loss": 1.1782, "step": 802 }, { "epoch": 0.02, "learning_rate": 4.031124497991968e-06, "loss": 1.1559, "step": 803 }, { "epoch": 0.02, "learning_rate": 4.036144578313254e-06, "loss": 1.1214, "step": 804 }, { "epoch": 0.02, "learning_rate": 4.0411646586345385e-06, "loss": 1.0647, "step": 805 }, { "epoch": 0.02, "learning_rate": 4.046184738955823e-06, "loss": 1.1761, "step": 806 }, { "epoch": 0.02, "learning_rate": 4.051204819277109e-06, "loss": 1.2045, "step": 807 }, { "epoch": 0.02, "learning_rate": 4.056224899598394e-06, "loss": 1.1516, "step": 808 }, { "epoch": 0.02, "learning_rate": 4.061244979919679e-06, "loss": 1.0133, "step": 809 }, { "epoch": 0.02, "learning_rate": 4.066265060240964e-06, "loss": 1.1262, "step": 810 }, { "epoch": 0.02, "learning_rate": 4.07128514056225e-06, "loss": 1.136, "step": 811 }, { "epoch": 0.02, "learning_rate": 4.076305220883534e-06, "loss": 1.2465, "step": 812 }, { "epoch": 0.02, "learning_rate": 4.08132530120482e-06, "loss": 1.121, "step": 813 }, { "epoch": 0.02, "learning_rate": 4.086345381526104e-06, "loss": 1.1965, "step": 814 }, { "epoch": 0.02, "learning_rate": 4.09136546184739e-06, "loss": 1.1956, "step": 815 }, { "epoch": 0.02, "learning_rate": 4.096385542168675e-06, "loss": 1.2074, "step": 816 }, { "epoch": 0.02, "learning_rate": 4.10140562248996e-06, "loss": 1.2259, "step": 817 }, { "epoch": 0.02, "learning_rate": 4.106425702811245e-06, "loss": 1.2367, "step": 818 }, { "epoch": 0.02, "learning_rate": 4.111445783132531e-06, "loss": 1.2288, "step": 819 }, { "epoch": 0.02, "learning_rate": 4.1164658634538155e-06, "loss": 1.0935, "step": 820 }, { "epoch": 0.02, "learning_rate": 4.121485943775101e-06, "loss": 1.1758, "step": 821 }, { "epoch": 0.02, "learning_rate": 4.1265060240963865e-06, "loss": 1.157, "step": 822 }, { "epoch": 0.02, "learning_rate": 4.131526104417671e-06, "loss": 1.2372, "step": 823 }, { "epoch": 0.02, "learning_rate": 4.136546184738956e-06, "loss": 1.1852, "step": 824 }, { "epoch": 0.02, "learning_rate": 4.141566265060241e-06, "loss": 1.2545, "step": 825 }, { "epoch": 0.02, "learning_rate": 4.146586345381527e-06, "loss": 1.1528, "step": 826 }, { "epoch": 0.02, "learning_rate": 4.151606425702811e-06, "loss": 1.2108, "step": 827 }, { "epoch": 0.02, "learning_rate": 4.156626506024097e-06, "loss": 1.2369, "step": 828 }, { "epoch": 0.02, "learning_rate": 4.161646586345382e-06, "loss": 1.1534, "step": 829 }, { "epoch": 0.03, "learning_rate": 4.166666666666667e-06, "loss": 1.1229, "step": 830 }, { "epoch": 0.03, "learning_rate": 4.171686746987952e-06, "loss": 1.1689, "step": 831 }, { "epoch": 0.03, "learning_rate": 4.176706827309237e-06, "loss": 1.2139, "step": 832 }, { "epoch": 0.03, "learning_rate": 4.1817269076305224e-06, "loss": 1.1818, "step": 833 }, { "epoch": 0.03, "learning_rate": 4.186746987951807e-06, "loss": 1.0599, "step": 834 }, { "epoch": 0.03, "learning_rate": 4.1917670682730925e-06, "loss": 1.1351, "step": 835 }, { "epoch": 0.03, "learning_rate": 4.196787148594378e-06, "loss": 1.193, "step": 836 }, { "epoch": 0.03, "learning_rate": 4.201807228915663e-06, "loss": 1.2032, "step": 837 }, { "epoch": 0.03, "learning_rate": 4.206827309236948e-06, "loss": 1.1447, "step": 838 }, { "epoch": 0.03, "learning_rate": 4.211847389558234e-06, "loss": 1.0885, "step": 839 }, { "epoch": 0.03, "learning_rate": 4.216867469879519e-06, "loss": 1.1421, "step": 840 }, { "epoch": 0.03, "learning_rate": 4.221887550200804e-06, "loss": 1.2253, "step": 841 }, { "epoch": 0.03, "learning_rate": 4.226907630522088e-06, "loss": 1.2026, "step": 842 }, { "epoch": 0.03, "learning_rate": 4.231927710843374e-06, "loss": 1.194, "step": 843 }, { "epoch": 0.03, "learning_rate": 4.236947791164659e-06, "loss": 1.187, "step": 844 }, { "epoch": 0.03, "learning_rate": 4.241967871485944e-06, "loss": 1.1255, "step": 845 }, { "epoch": 0.03, "learning_rate": 4.246987951807229e-06, "loss": 1.0867, "step": 846 }, { "epoch": 0.03, "learning_rate": 4.252008032128515e-06, "loss": 1.1239, "step": 847 }, { "epoch": 0.03, "learning_rate": 4.2570281124497995e-06, "loss": 1.1511, "step": 848 }, { "epoch": 0.03, "learning_rate": 4.262048192771085e-06, "loss": 1.2089, "step": 849 }, { "epoch": 0.03, "learning_rate": 4.2670682730923696e-06, "loss": 1.3069, "step": 850 }, { "epoch": 0.03, "learning_rate": 4.272088353413655e-06, "loss": 1.1969, "step": 851 }, { "epoch": 0.03, "learning_rate": 4.27710843373494e-06, "loss": 1.1122, "step": 852 }, { "epoch": 0.03, "learning_rate": 4.282128514056225e-06, "loss": 1.1059, "step": 853 }, { "epoch": 0.03, "learning_rate": 4.287148594377511e-06, "loss": 1.2266, "step": 854 }, { "epoch": 0.03, "learning_rate": 4.292168674698795e-06, "loss": 1.1371, "step": 855 }, { "epoch": 0.03, "learning_rate": 4.297188755020081e-06, "loss": 1.1995, "step": 856 }, { "epoch": 0.03, "learning_rate": 4.302208835341366e-06, "loss": 1.1223, "step": 857 }, { "epoch": 0.03, "learning_rate": 4.307228915662651e-06, "loss": 1.2378, "step": 858 }, { "epoch": 0.03, "learning_rate": 4.312248995983936e-06, "loss": 1.0909, "step": 859 }, { "epoch": 0.03, "learning_rate": 4.317269076305221e-06, "loss": 1.2485, "step": 860 }, { "epoch": 0.03, "learning_rate": 4.322289156626506e-06, "loss": 1.2812, "step": 861 }, { "epoch": 0.03, "learning_rate": 4.327309236947792e-06, "loss": 1.1661, "step": 862 }, { "epoch": 0.03, "learning_rate": 4.3323293172690765e-06, "loss": 1.2351, "step": 863 }, { "epoch": 0.03, "learning_rate": 4.337349397590362e-06, "loss": 1.0648, "step": 864 }, { "epoch": 0.03, "learning_rate": 4.3423694779116474e-06, "loss": 1.2664, "step": 865 }, { "epoch": 0.03, "learning_rate": 4.347389558232932e-06, "loss": 1.1964, "step": 866 }, { "epoch": 0.03, "learning_rate": 4.3524096385542175e-06, "loss": 1.2455, "step": 867 }, { "epoch": 0.03, "learning_rate": 4.357429718875502e-06, "loss": 1.1878, "step": 868 }, { "epoch": 0.03, "learning_rate": 4.362449799196788e-06, "loss": 1.1794, "step": 869 }, { "epoch": 0.03, "learning_rate": 4.367469879518072e-06, "loss": 1.1956, "step": 870 }, { "epoch": 0.03, "learning_rate": 4.372489959839358e-06, "loss": 1.2058, "step": 871 }, { "epoch": 0.03, "learning_rate": 4.377510040160643e-06, "loss": 1.2101, "step": 872 }, { "epoch": 0.03, "learning_rate": 4.382530120481928e-06, "loss": 1.153, "step": 873 }, { "epoch": 0.03, "learning_rate": 4.387550200803213e-06, "loss": 1.2831, "step": 874 }, { "epoch": 0.03, "learning_rate": 4.392570281124499e-06, "loss": 1.2347, "step": 875 }, { "epoch": 0.03, "learning_rate": 4.397590361445783e-06, "loss": 1.1672, "step": 876 }, { "epoch": 0.03, "learning_rate": 4.402610441767068e-06, "loss": 1.2123, "step": 877 }, { "epoch": 0.03, "learning_rate": 4.4076305220883535e-06, "loss": 1.1037, "step": 878 }, { "epoch": 0.03, "learning_rate": 4.412650602409639e-06, "loss": 1.2438, "step": 879 }, { "epoch": 0.03, "learning_rate": 4.4176706827309244e-06, "loss": 0.997, "step": 880 }, { "epoch": 0.03, "learning_rate": 4.422690763052209e-06, "loss": 1.2045, "step": 881 }, { "epoch": 0.03, "learning_rate": 4.4277108433734945e-06, "loss": 1.1196, "step": 882 }, { "epoch": 0.03, "learning_rate": 4.43273092369478e-06, "loss": 1.1945, "step": 883 }, { "epoch": 0.03, "learning_rate": 4.437751004016065e-06, "loss": 1.0784, "step": 884 }, { "epoch": 0.03, "learning_rate": 4.442771084337349e-06, "loss": 1.1674, "step": 885 }, { "epoch": 0.03, "learning_rate": 4.447791164658635e-06, "loss": 1.1193, "step": 886 }, { "epoch": 0.03, "learning_rate": 4.45281124497992e-06, "loss": 1.1965, "step": 887 }, { "epoch": 0.03, "learning_rate": 4.457831325301205e-06, "loss": 1.1005, "step": 888 }, { "epoch": 0.03, "learning_rate": 4.46285140562249e-06, "loss": 1.1612, "step": 889 }, { "epoch": 0.03, "learning_rate": 4.467871485943776e-06, "loss": 1.2306, "step": 890 }, { "epoch": 0.03, "learning_rate": 4.47289156626506e-06, "loss": 1.1507, "step": 891 }, { "epoch": 0.03, "learning_rate": 4.477911646586346e-06, "loss": 1.2439, "step": 892 }, { "epoch": 0.03, "learning_rate": 4.482931726907631e-06, "loss": 1.127, "step": 893 }, { "epoch": 0.03, "learning_rate": 4.487951807228916e-06, "loss": 1.2712, "step": 894 }, { "epoch": 0.03, "learning_rate": 4.492971887550201e-06, "loss": 1.1355, "step": 895 }, { "epoch": 0.03, "learning_rate": 4.497991967871486e-06, "loss": 1.1252, "step": 896 }, { "epoch": 0.03, "learning_rate": 4.5030120481927716e-06, "loss": 1.1775, "step": 897 }, { "epoch": 0.03, "learning_rate": 4.508032128514056e-06, "loss": 1.1984, "step": 898 }, { "epoch": 0.03, "learning_rate": 4.513052208835342e-06, "loss": 1.2047, "step": 899 }, { "epoch": 0.03, "learning_rate": 4.518072289156627e-06, "loss": 1.1887, "step": 900 }, { "epoch": 0.03, "learning_rate": 4.523092369477913e-06, "loss": 1.1821, "step": 901 }, { "epoch": 0.03, "learning_rate": 4.528112449799197e-06, "loss": 1.1843, "step": 902 }, { "epoch": 0.03, "learning_rate": 4.533132530120482e-06, "loss": 1.2064, "step": 903 }, { "epoch": 0.03, "learning_rate": 4.538152610441767e-06, "loss": 1.2113, "step": 904 }, { "epoch": 0.03, "learning_rate": 4.543172690763053e-06, "loss": 1.1174, "step": 905 }, { "epoch": 0.03, "learning_rate": 4.5481927710843374e-06, "loss": 1.2171, "step": 906 }, { "epoch": 0.03, "learning_rate": 4.553212851405623e-06, "loss": 1.1845, "step": 907 }, { "epoch": 0.03, "learning_rate": 4.558232931726908e-06, "loss": 1.1942, "step": 908 }, { "epoch": 0.03, "learning_rate": 4.563253012048193e-06, "loss": 1.1784, "step": 909 }, { "epoch": 0.03, "learning_rate": 4.5682730923694785e-06, "loss": 1.1885, "step": 910 }, { "epoch": 0.03, "learning_rate": 4.573293172690764e-06, "loss": 1.2352, "step": 911 }, { "epoch": 0.03, "learning_rate": 4.578313253012049e-06, "loss": 1.2156, "step": 912 }, { "epoch": 0.03, "learning_rate": 4.583333333333333e-06, "loss": 1.2905, "step": 913 }, { "epoch": 0.03, "learning_rate": 4.588353413654619e-06, "loss": 1.1228, "step": 914 }, { "epoch": 0.03, "learning_rate": 4.593373493975904e-06, "loss": 1.1265, "step": 915 }, { "epoch": 0.03, "learning_rate": 4.598393574297189e-06, "loss": 1.2225, "step": 916 }, { "epoch": 0.03, "learning_rate": 4.603413654618474e-06, "loss": 1.2507, "step": 917 }, { "epoch": 0.03, "learning_rate": 4.60843373493976e-06, "loss": 1.2174, "step": 918 }, { "epoch": 0.03, "learning_rate": 4.613453815261044e-06, "loss": 1.0972, "step": 919 }, { "epoch": 0.03, "learning_rate": 4.61847389558233e-06, "loss": 1.1577, "step": 920 }, { "epoch": 0.03, "learning_rate": 4.6234939759036145e-06, "loss": 1.1324, "step": 921 }, { "epoch": 0.03, "learning_rate": 4.6285140562249e-06, "loss": 1.1468, "step": 922 }, { "epoch": 0.03, "learning_rate": 4.633534136546185e-06, "loss": 1.0754, "step": 923 }, { "epoch": 0.03, "learning_rate": 4.63855421686747e-06, "loss": 1.0976, "step": 924 }, { "epoch": 0.03, "learning_rate": 4.6435742971887555e-06, "loss": 1.2158, "step": 925 }, { "epoch": 0.03, "learning_rate": 4.648594377510041e-06, "loss": 1.1849, "step": 926 }, { "epoch": 0.03, "learning_rate": 4.653614457831326e-06, "loss": 1.1783, "step": 927 }, { "epoch": 0.03, "learning_rate": 4.658634538152611e-06, "loss": 1.1724, "step": 928 }, { "epoch": 0.03, "learning_rate": 4.6636546184738966e-06, "loss": 1.1661, "step": 929 }, { "epoch": 0.03, "learning_rate": 4.668674698795181e-06, "loss": 1.0807, "step": 930 }, { "epoch": 0.03, "learning_rate": 4.673694779116466e-06, "loss": 1.2581, "step": 931 }, { "epoch": 0.03, "learning_rate": 4.678714859437751e-06, "loss": 1.1266, "step": 932 }, { "epoch": 0.03, "learning_rate": 4.683734939759037e-06, "loss": 1.2342, "step": 933 }, { "epoch": 0.03, "learning_rate": 4.688755020080321e-06, "loss": 1.1434, "step": 934 }, { "epoch": 0.03, "learning_rate": 4.693775100401607e-06, "loss": 1.1605, "step": 935 }, { "epoch": 0.03, "learning_rate": 4.698795180722892e-06, "loss": 1.1944, "step": 936 }, { "epoch": 0.03, "learning_rate": 4.703815261044177e-06, "loss": 1.3027, "step": 937 }, { "epoch": 0.03, "learning_rate": 4.7088353413654624e-06, "loss": 1.2478, "step": 938 }, { "epoch": 0.03, "learning_rate": 4.713855421686747e-06, "loss": 1.1047, "step": 939 }, { "epoch": 0.03, "learning_rate": 4.7188755020080325e-06, "loss": 1.2137, "step": 940 }, { "epoch": 0.03, "learning_rate": 4.723895582329317e-06, "loss": 1.1926, "step": 941 }, { "epoch": 0.03, "learning_rate": 4.728915662650603e-06, "loss": 1.301, "step": 942 }, { "epoch": 0.03, "learning_rate": 4.733935742971888e-06, "loss": 1.3237, "step": 943 }, { "epoch": 0.03, "learning_rate": 4.7389558232931736e-06, "loss": 1.1144, "step": 944 }, { "epoch": 0.03, "learning_rate": 4.743975903614458e-06, "loss": 1.1965, "step": 945 }, { "epoch": 0.03, "learning_rate": 4.748995983935744e-06, "loss": 1.1981, "step": 946 }, { "epoch": 0.03, "learning_rate": 4.754016064257029e-06, "loss": 1.2367, "step": 947 }, { "epoch": 0.03, "learning_rate": 4.759036144578314e-06, "loss": 1.2113, "step": 948 }, { "epoch": 0.03, "learning_rate": 4.764056224899598e-06, "loss": 1.092, "step": 949 }, { "epoch": 0.03, "learning_rate": 4.769076305220884e-06, "loss": 1.0604, "step": 950 }, { "epoch": 0.03, "learning_rate": 4.774096385542169e-06, "loss": 1.1526, "step": 951 }, { "epoch": 0.03, "learning_rate": 4.779116465863454e-06, "loss": 1.0151, "step": 952 }, { "epoch": 0.03, "learning_rate": 4.7841365461847394e-06, "loss": 1.1007, "step": 953 }, { "epoch": 0.03, "learning_rate": 4.789156626506025e-06, "loss": 1.1938, "step": 954 }, { "epoch": 0.03, "learning_rate": 4.7941767068273095e-06, "loss": 1.1664, "step": 955 }, { "epoch": 0.03, "learning_rate": 4.799196787148594e-06, "loss": 1.2405, "step": 956 }, { "epoch": 0.03, "learning_rate": 4.80421686746988e-06, "loss": 1.1171, "step": 957 }, { "epoch": 0.03, "learning_rate": 4.809236947791165e-06, "loss": 1.1636, "step": 958 }, { "epoch": 0.03, "learning_rate": 4.81425702811245e-06, "loss": 1.1574, "step": 959 }, { "epoch": 0.03, "learning_rate": 4.819277108433735e-06, "loss": 1.1075, "step": 960 }, { "epoch": 0.03, "learning_rate": 4.824297188755021e-06, "loss": 1.2254, "step": 961 }, { "epoch": 0.03, "learning_rate": 4.829317269076305e-06, "loss": 1.2274, "step": 962 }, { "epoch": 0.03, "learning_rate": 4.834337349397591e-06, "loss": 1.17, "step": 963 }, { "epoch": 0.03, "learning_rate": 4.839357429718876e-06, "loss": 1.1818, "step": 964 }, { "epoch": 0.03, "learning_rate": 4.844377510040161e-06, "loss": 1.215, "step": 965 }, { "epoch": 0.03, "learning_rate": 4.849397590361446e-06, "loss": 1.2313, "step": 966 }, { "epoch": 0.03, "learning_rate": 4.854417670682731e-06, "loss": 1.2126, "step": 967 }, { "epoch": 0.03, "learning_rate": 4.8594377510040165e-06, "loss": 1.3407, "step": 968 }, { "epoch": 0.03, "learning_rate": 4.864457831325302e-06, "loss": 1.0948, "step": 969 }, { "epoch": 0.03, "learning_rate": 4.8694779116465866e-06, "loss": 1.151, "step": 970 }, { "epoch": 0.03, "learning_rate": 4.874497991967872e-06, "loss": 1.1895, "step": 971 }, { "epoch": 0.03, "learning_rate": 4.8795180722891575e-06, "loss": 1.2261, "step": 972 }, { "epoch": 0.03, "learning_rate": 4.884538152610442e-06, "loss": 1.1776, "step": 973 }, { "epoch": 0.03, "learning_rate": 4.889558232931727e-06, "loss": 1.0862, "step": 974 }, { "epoch": 0.03, "learning_rate": 4.894578313253012e-06, "loss": 1.2307, "step": 975 }, { "epoch": 0.03, "learning_rate": 4.899598393574298e-06, "loss": 1.1899, "step": 976 }, { "epoch": 0.03, "learning_rate": 4.904618473895582e-06, "loss": 1.1544, "step": 977 }, { "epoch": 0.03, "learning_rate": 4.909638554216868e-06, "loss": 1.14, "step": 978 }, { "epoch": 0.03, "learning_rate": 4.914658634538153e-06, "loss": 1.147, "step": 979 }, { "epoch": 0.03, "learning_rate": 4.919678714859438e-06, "loss": 1.271, "step": 980 }, { "epoch": 0.03, "learning_rate": 4.924698795180723e-06, "loss": 1.3358, "step": 981 }, { "epoch": 0.03, "learning_rate": 4.929718875502009e-06, "loss": 1.1552, "step": 982 }, { "epoch": 0.03, "learning_rate": 4.9347389558232935e-06, "loss": 1.1945, "step": 983 }, { "epoch": 0.03, "learning_rate": 4.939759036144578e-06, "loss": 1.2268, "step": 984 }, { "epoch": 0.03, "learning_rate": 4.944779116465864e-06, "loss": 1.1343, "step": 985 }, { "epoch": 0.03, "learning_rate": 4.949799196787149e-06, "loss": 1.1038, "step": 986 }, { "epoch": 0.03, "learning_rate": 4.9548192771084345e-06, "loss": 1.14, "step": 987 }, { "epoch": 0.03, "learning_rate": 4.959839357429719e-06, "loss": 1.1661, "step": 988 }, { "epoch": 0.03, "learning_rate": 4.964859437751005e-06, "loss": 1.2185, "step": 989 }, { "epoch": 0.03, "learning_rate": 4.96987951807229e-06, "loss": 1.0518, "step": 990 }, { "epoch": 0.03, "learning_rate": 4.974899598393575e-06, "loss": 1.073, "step": 991 }, { "epoch": 0.03, "learning_rate": 4.979919678714859e-06, "loss": 1.1993, "step": 992 }, { "epoch": 0.03, "learning_rate": 4.984939759036145e-06, "loss": 1.1627, "step": 993 }, { "epoch": 0.03, "learning_rate": 4.98995983935743e-06, "loss": 1.1975, "step": 994 }, { "epoch": 0.03, "learning_rate": 4.994979919678715e-06, "loss": 1.1283, "step": 995 }, { "epoch": 0.03, "learning_rate": 5e-06, "loss": 1.1426, "step": 996 }, { "epoch": 0.03, "learning_rate": 4.999999988100602e-06, "loss": 1.0962, "step": 997 }, { "epoch": 0.03, "learning_rate": 4.999999952402409e-06, "loss": 1.1393, "step": 998 }, { "epoch": 0.03, "learning_rate": 4.999999892905419e-06, "loss": 1.2229, "step": 999 }, { "epoch": 0.03, "learning_rate": 4.999999809609635e-06, "loss": 1.1984, "step": 1000 }, { "epoch": 0.03, "learning_rate": 4.9999997025150566e-06, "loss": 1.1069, "step": 1001 }, { "epoch": 0.03, "learning_rate": 4.9999995716216856e-06, "loss": 1.2445, "step": 1002 }, { "epoch": 0.03, "learning_rate": 4.999999416929522e-06, "loss": 1.1068, "step": 1003 }, { "epoch": 0.03, "learning_rate": 4.999999238438568e-06, "loss": 1.1652, "step": 1004 }, { "epoch": 0.03, "learning_rate": 4.999999036148825e-06, "loss": 1.3651, "step": 1005 }, { "epoch": 0.03, "learning_rate": 4.999998810060296e-06, "loss": 1.2017, "step": 1006 }, { "epoch": 0.03, "learning_rate": 4.999998560172981e-06, "loss": 1.3706, "step": 1007 }, { "epoch": 0.03, "learning_rate": 4.999998286486886e-06, "loss": 1.147, "step": 1008 }, { "epoch": 0.03, "learning_rate": 4.99999798900201e-06, "loss": 1.1786, "step": 1009 }, { "epoch": 0.03, "learning_rate": 4.999997667718357e-06, "loss": 1.1466, "step": 1010 }, { "epoch": 0.03, "learning_rate": 4.999997322635931e-06, "loss": 1.1344, "step": 1011 }, { "epoch": 0.03, "learning_rate": 4.999996953754734e-06, "loss": 1.1438, "step": 1012 }, { "epoch": 0.03, "learning_rate": 4.99999656107477e-06, "loss": 1.1802, "step": 1013 }, { "epoch": 0.03, "learning_rate": 4.9999961445960435e-06, "loss": 1.1579, "step": 1014 }, { "epoch": 0.03, "learning_rate": 4.9999957043185565e-06, "loss": 1.1469, "step": 1015 }, { "epoch": 0.03, "learning_rate": 4.999995240242315e-06, "loss": 1.2335, "step": 1016 }, { "epoch": 0.03, "learning_rate": 4.9999947523673235e-06, "loss": 1.1745, "step": 1017 }, { "epoch": 0.03, "learning_rate": 4.999994240693585e-06, "loss": 1.186, "step": 1018 }, { "epoch": 0.03, "learning_rate": 4.999993705221106e-06, "loss": 1.239, "step": 1019 }, { "epoch": 0.03, "learning_rate": 4.999993145949891e-06, "loss": 1.24, "step": 1020 }, { "epoch": 0.03, "learning_rate": 4.999992562879945e-06, "loss": 1.0895, "step": 1021 }, { "epoch": 0.03, "learning_rate": 4.999991956011274e-06, "loss": 1.2142, "step": 1022 }, { "epoch": 0.03, "learning_rate": 4.999991325343883e-06, "loss": 1.2047, "step": 1023 }, { "epoch": 0.03, "learning_rate": 4.999990670877779e-06, "loss": 1.1187, "step": 1024 }, { "epoch": 0.03, "learning_rate": 4.999989992612968e-06, "loss": 1.1071, "step": 1025 }, { "epoch": 0.03, "learning_rate": 4.999989290549456e-06, "loss": 1.1879, "step": 1026 }, { "epoch": 0.03, "learning_rate": 4.999988564687251e-06, "loss": 1.1371, "step": 1027 }, { "epoch": 0.03, "learning_rate": 4.999987815026358e-06, "loss": 1.0531, "step": 1028 }, { "epoch": 0.03, "learning_rate": 4.999987041566785e-06, "loss": 1.2164, "step": 1029 }, { "epoch": 0.03, "learning_rate": 4.99998624430854e-06, "loss": 1.1174, "step": 1030 }, { "epoch": 0.03, "learning_rate": 4.9999854232516295e-06, "loss": 1.2925, "step": 1031 }, { "epoch": 0.03, "learning_rate": 4.999984578396062e-06, "loss": 1.2159, "step": 1032 }, { "epoch": 0.03, "learning_rate": 4.9999837097418455e-06, "loss": 1.2043, "step": 1033 }, { "epoch": 0.03, "learning_rate": 4.9999828172889875e-06, "loss": 1.1185, "step": 1034 }, { "epoch": 0.03, "learning_rate": 4.999981901037498e-06, "loss": 1.1368, "step": 1035 }, { "epoch": 0.03, "learning_rate": 4.999980960987384e-06, "loss": 1.0931, "step": 1036 }, { "epoch": 0.03, "learning_rate": 4.999979997138656e-06, "loss": 1.1481, "step": 1037 }, { "epoch": 0.03, "learning_rate": 4.9999790094913214e-06, "loss": 1.1769, "step": 1038 }, { "epoch": 0.03, "learning_rate": 4.999977998045391e-06, "loss": 1.1815, "step": 1039 }, { "epoch": 0.03, "learning_rate": 4.999976962800875e-06, "loss": 1.1688, "step": 1040 }, { "epoch": 0.03, "learning_rate": 4.999975903757782e-06, "loss": 1.2178, "step": 1041 }, { "epoch": 0.03, "learning_rate": 4.999974820916122e-06, "loss": 1.3155, "step": 1042 }, { "epoch": 0.03, "learning_rate": 4.9999737142759054e-06, "loss": 1.1658, "step": 1043 }, { "epoch": 0.03, "learning_rate": 4.999972583837144e-06, "loss": 1.2227, "step": 1044 }, { "epoch": 0.03, "learning_rate": 4.999971429599847e-06, "loss": 1.2305, "step": 1045 }, { "epoch": 0.03, "learning_rate": 4.999970251564027e-06, "loss": 1.1798, "step": 1046 }, { "epoch": 0.03, "learning_rate": 4.999969049729693e-06, "loss": 1.2107, "step": 1047 }, { "epoch": 0.03, "learning_rate": 4.999967824096859e-06, "loss": 1.229, "step": 1048 }, { "epoch": 0.03, "learning_rate": 4.999966574665534e-06, "loss": 1.2759, "step": 1049 }, { "epoch": 0.03, "learning_rate": 4.999965301435731e-06, "loss": 1.267, "step": 1050 }, { "epoch": 0.03, "learning_rate": 4.999964004407463e-06, "loss": 1.2127, "step": 1051 }, { "epoch": 0.03, "learning_rate": 4.9999626835807426e-06, "loss": 1.2075, "step": 1052 }, { "epoch": 0.03, "learning_rate": 4.99996133895558e-06, "loss": 1.2308, "step": 1053 }, { "epoch": 0.03, "learning_rate": 4.99995997053199e-06, "loss": 1.1908, "step": 1054 }, { "epoch": 0.03, "learning_rate": 4.999958578309986e-06, "loss": 1.246, "step": 1055 }, { "epoch": 0.03, "learning_rate": 4.999957162289579e-06, "loss": 1.2063, "step": 1056 }, { "epoch": 0.03, "learning_rate": 4.999955722470785e-06, "loss": 1.2684, "step": 1057 }, { "epoch": 0.03, "learning_rate": 4.9999542588536155e-06, "loss": 1.2144, "step": 1058 }, { "epoch": 0.03, "learning_rate": 4.999952771438086e-06, "loss": 1.215, "step": 1059 }, { "epoch": 0.03, "learning_rate": 4.999951260224211e-06, "loss": 1.1271, "step": 1060 }, { "epoch": 0.03, "learning_rate": 4.999949725212002e-06, "loss": 1.1584, "step": 1061 }, { "epoch": 0.03, "learning_rate": 4.999948166401477e-06, "loss": 1.2246, "step": 1062 }, { "epoch": 0.03, "learning_rate": 4.9999465837926495e-06, "loss": 1.2926, "step": 1063 }, { "epoch": 0.03, "learning_rate": 4.999944977385534e-06, "loss": 1.2111, "step": 1064 }, { "epoch": 0.03, "learning_rate": 4.999943347180146e-06, "loss": 1.1289, "step": 1065 }, { "epoch": 0.03, "learning_rate": 4.999941693176502e-06, "loss": 1.1743, "step": 1066 }, { "epoch": 0.03, "learning_rate": 4.9999400153746174e-06, "loss": 1.2651, "step": 1067 }, { "epoch": 0.03, "learning_rate": 4.999938313774507e-06, "loss": 1.2295, "step": 1068 }, { "epoch": 0.03, "learning_rate": 4.999936588376189e-06, "loss": 1.2891, "step": 1069 }, { "epoch": 0.03, "learning_rate": 4.999934839179678e-06, "loss": 1.2282, "step": 1070 }, { "epoch": 0.03, "learning_rate": 4.999933066184991e-06, "loss": 1.0869, "step": 1071 }, { "epoch": 0.03, "learning_rate": 4.999931269392146e-06, "loss": 1.1109, "step": 1072 }, { "epoch": 0.03, "learning_rate": 4.999929448801159e-06, "loss": 1.2327, "step": 1073 }, { "epoch": 0.03, "learning_rate": 4.999927604412047e-06, "loss": 1.2316, "step": 1074 }, { "epoch": 0.03, "learning_rate": 4.999925736224829e-06, "loss": 1.134, "step": 1075 }, { "epoch": 0.03, "learning_rate": 4.999923844239522e-06, "loss": 1.2374, "step": 1076 }, { "epoch": 0.03, "learning_rate": 4.999921928456144e-06, "loss": 1.0983, "step": 1077 }, { "epoch": 0.03, "learning_rate": 4.9999199888747126e-06, "loss": 1.2, "step": 1078 }, { "epoch": 0.03, "learning_rate": 4.999918025495247e-06, "loss": 1.1359, "step": 1079 }, { "epoch": 0.03, "learning_rate": 4.999916038317767e-06, "loss": 1.1466, "step": 1080 }, { "epoch": 0.03, "learning_rate": 4.999914027342289e-06, "loss": 1.1652, "step": 1081 }, { "epoch": 0.03, "learning_rate": 4.999911992568835e-06, "loss": 1.2798, "step": 1082 }, { "epoch": 0.03, "learning_rate": 4.999909933997421e-06, "loss": 1.1194, "step": 1083 }, { "epoch": 0.03, "learning_rate": 4.999907851628069e-06, "loss": 1.1921, "step": 1084 }, { "epoch": 0.03, "learning_rate": 4.999905745460798e-06, "loss": 1.1752, "step": 1085 }, { "epoch": 0.03, "learning_rate": 4.999903615495629e-06, "loss": 1.0582, "step": 1086 }, { "epoch": 0.03, "learning_rate": 4.999901461732581e-06, "loss": 1.2693, "step": 1087 }, { "epoch": 0.03, "learning_rate": 4.9998992841716755e-06, "loss": 1.1343, "step": 1088 }, { "epoch": 0.03, "learning_rate": 4.999897082812933e-06, "loss": 1.1774, "step": 1089 }, { "epoch": 0.03, "learning_rate": 4.999894857656374e-06, "loss": 1.1225, "step": 1090 }, { "epoch": 0.03, "learning_rate": 4.99989260870202e-06, "loss": 1.2132, "step": 1091 }, { "epoch": 0.03, "learning_rate": 4.999890335949892e-06, "loss": 1.252, "step": 1092 }, { "epoch": 0.03, "learning_rate": 4.999888039400013e-06, "loss": 1.3153, "step": 1093 }, { "epoch": 0.03, "learning_rate": 4.999885719052402e-06, "loss": 1.1531, "step": 1094 }, { "epoch": 0.03, "learning_rate": 4.9998833749070844e-06, "loss": 1.1693, "step": 1095 }, { "epoch": 0.03, "learning_rate": 4.999881006964081e-06, "loss": 1.1575, "step": 1096 }, { "epoch": 0.03, "learning_rate": 4.999878615223414e-06, "loss": 1.0947, "step": 1097 }, { "epoch": 0.03, "learning_rate": 4.9998761996851064e-06, "loss": 1.0804, "step": 1098 }, { "epoch": 0.03, "learning_rate": 4.9998737603491824e-06, "loss": 1.1156, "step": 1099 }, { "epoch": 0.03, "learning_rate": 4.999871297215663e-06, "loss": 1.3231, "step": 1100 }, { "epoch": 0.03, "learning_rate": 4.999868810284573e-06, "loss": 1.1637, "step": 1101 }, { "epoch": 0.03, "learning_rate": 4.999866299555936e-06, "loss": 1.0512, "step": 1102 }, { "epoch": 0.03, "learning_rate": 4.999863765029776e-06, "loss": 1.1562, "step": 1103 }, { "epoch": 0.03, "learning_rate": 4.999861206706117e-06, "loss": 1.3119, "step": 1104 }, { "epoch": 0.03, "learning_rate": 4.999858624584983e-06, "loss": 1.1174, "step": 1105 }, { "epoch": 0.03, "learning_rate": 4.9998560186663995e-06, "loss": 1.1951, "step": 1106 }, { "epoch": 0.03, "learning_rate": 4.99985338895039e-06, "loss": 1.2593, "step": 1107 }, { "epoch": 0.03, "learning_rate": 4.99985073543698e-06, "loss": 1.2359, "step": 1108 }, { "epoch": 0.03, "learning_rate": 4.999848058126196e-06, "loss": 1.167, "step": 1109 }, { "epoch": 0.03, "learning_rate": 4.999845357018061e-06, "loss": 1.1573, "step": 1110 }, { "epoch": 0.03, "learning_rate": 4.999842632112603e-06, "loss": 1.1613, "step": 1111 }, { "epoch": 0.03, "learning_rate": 4.999839883409847e-06, "loss": 1.2385, "step": 1112 }, { "epoch": 0.03, "learning_rate": 4.99983711090982e-06, "loss": 1.1591, "step": 1113 }, { "epoch": 0.03, "learning_rate": 4.999834314612547e-06, "loss": 1.1066, "step": 1114 }, { "epoch": 0.03, "learning_rate": 4.999831494518055e-06, "loss": 1.1952, "step": 1115 }, { "epoch": 0.03, "learning_rate": 4.999828650626372e-06, "loss": 1.2571, "step": 1116 }, { "epoch": 0.03, "learning_rate": 4.999825782937523e-06, "loss": 1.131, "step": 1117 }, { "epoch": 0.03, "learning_rate": 4.999822891451537e-06, "loss": 1.3179, "step": 1118 }, { "epoch": 0.03, "learning_rate": 4.999819976168442e-06, "loss": 1.1736, "step": 1119 }, { "epoch": 0.03, "learning_rate": 4.999817037088264e-06, "loss": 1.1879, "step": 1120 }, { "epoch": 0.03, "learning_rate": 4.9998140742110315e-06, "loss": 1.1242, "step": 1121 }, { "epoch": 0.03, "learning_rate": 4.999811087536773e-06, "loss": 1.1285, "step": 1122 }, { "epoch": 0.03, "learning_rate": 4.9998080770655175e-06, "loss": 0.9915, "step": 1123 }, { "epoch": 0.03, "learning_rate": 4.999805042797292e-06, "loss": 1.0958, "step": 1124 }, { "epoch": 0.03, "learning_rate": 4.999801984732127e-06, "loss": 1.3636, "step": 1125 }, { "epoch": 0.03, "learning_rate": 4.9997989028700515e-06, "loss": 1.1879, "step": 1126 }, { "epoch": 0.03, "learning_rate": 4.999795797211094e-06, "loss": 1.0811, "step": 1127 }, { "epoch": 0.03, "learning_rate": 4.999792667755285e-06, "loss": 1.1453, "step": 1128 }, { "epoch": 0.03, "learning_rate": 4.999789514502653e-06, "loss": 1.1284, "step": 1129 }, { "epoch": 0.03, "learning_rate": 4.9997863374532285e-06, "loss": 1.1063, "step": 1130 }, { "epoch": 0.03, "learning_rate": 4.999783136607043e-06, "loss": 1.2442, "step": 1131 }, { "epoch": 0.03, "learning_rate": 4.9997799119641256e-06, "loss": 1.2732, "step": 1132 }, { "epoch": 0.03, "learning_rate": 4.999776663524507e-06, "loss": 1.1505, "step": 1133 }, { "epoch": 0.03, "learning_rate": 4.999773391288219e-06, "loss": 1.1156, "step": 1134 }, { "epoch": 0.03, "learning_rate": 4.999770095255292e-06, "loss": 1.0813, "step": 1135 }, { "epoch": 0.03, "learning_rate": 4.999766775425757e-06, "loss": 1.0895, "step": 1136 }, { "epoch": 0.03, "learning_rate": 4.9997634317996465e-06, "loss": 1.136, "step": 1137 }, { "epoch": 0.03, "learning_rate": 4.999760064376993e-06, "loss": 1.1395, "step": 1138 }, { "epoch": 0.03, "learning_rate": 4.9997566731578275e-06, "loss": 1.2229, "step": 1139 }, { "epoch": 0.03, "learning_rate": 4.999753258142182e-06, "loss": 1.1729, "step": 1140 }, { "epoch": 0.03, "learning_rate": 4.999749819330089e-06, "loss": 1.1469, "step": 1141 }, { "epoch": 0.03, "learning_rate": 4.999746356721582e-06, "loss": 1.0867, "step": 1142 }, { "epoch": 0.03, "learning_rate": 4.999742870316693e-06, "loss": 1.1945, "step": 1143 }, { "epoch": 0.03, "learning_rate": 4.999739360115457e-06, "loss": 1.1962, "step": 1144 }, { "epoch": 0.03, "learning_rate": 4.999735826117905e-06, "loss": 1.2247, "step": 1145 }, { "epoch": 0.03, "learning_rate": 4.999732268324073e-06, "loss": 1.2083, "step": 1146 }, { "epoch": 0.03, "learning_rate": 4.999728686733993e-06, "loss": 1.2275, "step": 1147 }, { "epoch": 0.03, "learning_rate": 4.9997250813477e-06, "loss": 1.1683, "step": 1148 }, { "epoch": 0.03, "learning_rate": 4.999721452165227e-06, "loss": 1.3231, "step": 1149 }, { "epoch": 0.03, "learning_rate": 4.999717799186611e-06, "loss": 1.1262, "step": 1150 }, { "epoch": 0.03, "learning_rate": 4.999714122411886e-06, "loss": 1.2104, "step": 1151 }, { "epoch": 0.03, "learning_rate": 4.999710421841085e-06, "loss": 1.2039, "step": 1152 }, { "epoch": 0.03, "learning_rate": 4.999706697474246e-06, "loss": 1.1599, "step": 1153 }, { "epoch": 0.03, "learning_rate": 4.9997029493114025e-06, "loss": 1.2271, "step": 1154 }, { "epoch": 0.03, "learning_rate": 4.999699177352591e-06, "loss": 1.2039, "step": 1155 }, { "epoch": 0.03, "learning_rate": 4.999695381597847e-06, "loss": 1.2529, "step": 1156 }, { "epoch": 0.03, "learning_rate": 4.999691562047206e-06, "loss": 1.1265, "step": 1157 }, { "epoch": 0.03, "learning_rate": 4.999687718700707e-06, "loss": 1.1567, "step": 1158 }, { "epoch": 0.03, "learning_rate": 4.999683851558383e-06, "loss": 1.1328, "step": 1159 }, { "epoch": 0.03, "learning_rate": 4.999679960620274e-06, "loss": 1.2083, "step": 1160 }, { "epoch": 0.03, "learning_rate": 4.999676045886415e-06, "loss": 1.2819, "step": 1161 }, { "epoch": 0.04, "learning_rate": 4.999672107356844e-06, "loss": 1.1095, "step": 1162 }, { "epoch": 0.04, "learning_rate": 4.999668145031598e-06, "loss": 1.1825, "step": 1163 }, { "epoch": 0.04, "learning_rate": 4.999664158910717e-06, "loss": 1.1627, "step": 1164 }, { "epoch": 0.04, "learning_rate": 4.999660148994235e-06, "loss": 1.094, "step": 1165 }, { "epoch": 0.04, "learning_rate": 4.999656115282194e-06, "loss": 1.1273, "step": 1166 }, { "epoch": 0.04, "learning_rate": 4.999652057774629e-06, "loss": 1.1158, "step": 1167 }, { "epoch": 0.04, "learning_rate": 4.999647976471581e-06, "loss": 1.2076, "step": 1168 }, { "epoch": 0.04, "learning_rate": 4.999643871373089e-06, "loss": 1.1868, "step": 1169 }, { "epoch": 0.04, "learning_rate": 4.99963974247919e-06, "loss": 1.2659, "step": 1170 }, { "epoch": 0.04, "learning_rate": 4.999635589789925e-06, "loss": 1.1815, "step": 1171 }, { "epoch": 0.04, "learning_rate": 4.999631413305332e-06, "loss": 1.1712, "step": 1172 }, { "epoch": 0.04, "learning_rate": 4.999627213025453e-06, "loss": 1.2735, "step": 1173 }, { "epoch": 0.04, "learning_rate": 4.999622988950326e-06, "loss": 1.138, "step": 1174 }, { "epoch": 0.04, "learning_rate": 4.9996187410799934e-06, "loss": 1.1069, "step": 1175 }, { "epoch": 0.04, "learning_rate": 4.999614469414493e-06, "loss": 1.1376, "step": 1176 }, { "epoch": 0.04, "learning_rate": 4.9996101739538674e-06, "loss": 1.2384, "step": 1177 }, { "epoch": 0.04, "learning_rate": 4.9996058546981565e-06, "loss": 1.1655, "step": 1178 }, { "epoch": 0.04, "learning_rate": 4.999601511647401e-06, "loss": 1.1713, "step": 1179 }, { "epoch": 0.04, "learning_rate": 4.999597144801645e-06, "loss": 1.245, "step": 1180 }, { "epoch": 0.04, "learning_rate": 4.999592754160925e-06, "loss": 1.2135, "step": 1181 }, { "epoch": 0.04, "learning_rate": 4.999588339725289e-06, "loss": 1.169, "step": 1182 }, { "epoch": 0.04, "learning_rate": 4.999583901494774e-06, "loss": 1.1592, "step": 1183 }, { "epoch": 0.04, "learning_rate": 4.999579439469424e-06, "loss": 1.1116, "step": 1184 }, { "epoch": 0.04, "learning_rate": 4.999574953649282e-06, "loss": 1.26, "step": 1185 }, { "epoch": 0.04, "learning_rate": 4.999570444034391e-06, "loss": 1.2175, "step": 1186 }, { "epoch": 0.04, "learning_rate": 4.9995659106247924e-06, "loss": 1.2877, "step": 1187 }, { "epoch": 0.04, "learning_rate": 4.99956135342053e-06, "loss": 1.1498, "step": 1188 }, { "epoch": 0.04, "learning_rate": 4.999556772421648e-06, "loss": 1.1068, "step": 1189 }, { "epoch": 0.04, "learning_rate": 4.999552167628189e-06, "loss": 1.1841, "step": 1190 }, { "epoch": 0.04, "learning_rate": 4.999547539040197e-06, "loss": 1.1891, "step": 1191 }, { "epoch": 0.04, "learning_rate": 4.999542886657717e-06, "loss": 1.1678, "step": 1192 }, { "epoch": 0.04, "learning_rate": 4.999538210480791e-06, "loss": 1.1044, "step": 1193 }, { "epoch": 0.04, "learning_rate": 4.9995335105094666e-06, "loss": 1.1766, "step": 1194 }, { "epoch": 0.04, "learning_rate": 4.999528786743786e-06, "loss": 1.2372, "step": 1195 }, { "epoch": 0.04, "learning_rate": 4.999524039183796e-06, "loss": 1.2316, "step": 1196 }, { "epoch": 0.04, "learning_rate": 4.99951926782954e-06, "loss": 1.1304, "step": 1197 }, { "epoch": 0.04, "learning_rate": 4.9995144726810655e-06, "loss": 1.2412, "step": 1198 }, { "epoch": 0.04, "learning_rate": 4.999509653738416e-06, "loss": 1.2106, "step": 1199 }, { "epoch": 0.04, "learning_rate": 4.999504811001639e-06, "loss": 1.354, "step": 1200 }, { "epoch": 0.04, "learning_rate": 4.99949994447078e-06, "loss": 1.1395, "step": 1201 }, { "epoch": 0.04, "learning_rate": 4.9994950541458855e-06, "loss": 1.1293, "step": 1202 }, { "epoch": 0.04, "learning_rate": 4.999490140027001e-06, "loss": 1.2606, "step": 1203 }, { "epoch": 0.04, "learning_rate": 4.999485202114175e-06, "loss": 1.3185, "step": 1204 }, { "epoch": 0.04, "learning_rate": 4.999480240407453e-06, "loss": 1.1711, "step": 1205 }, { "epoch": 0.04, "learning_rate": 4.999475254906884e-06, "loss": 1.3495, "step": 1206 }, { "epoch": 0.04, "learning_rate": 4.999470245612513e-06, "loss": 1.1733, "step": 1207 }, { "epoch": 0.04, "learning_rate": 4.999465212524389e-06, "loss": 1.1832, "step": 1208 }, { "epoch": 0.04, "learning_rate": 4.9994601556425615e-06, "loss": 1.1779, "step": 1209 }, { "epoch": 0.04, "learning_rate": 4.999455074967076e-06, "loss": 1.1512, "step": 1210 }, { "epoch": 0.04, "learning_rate": 4.999449970497982e-06, "loss": 1.2108, "step": 1211 }, { "epoch": 0.04, "learning_rate": 4.999444842235328e-06, "loss": 1.0408, "step": 1212 }, { "epoch": 0.04, "learning_rate": 4.999439690179164e-06, "loss": 1.1809, "step": 1213 }, { "epoch": 0.04, "learning_rate": 4.999434514329537e-06, "loss": 1.2138, "step": 1214 }, { "epoch": 0.04, "learning_rate": 4.999429314686497e-06, "loss": 1.1673, "step": 1215 }, { "epoch": 0.04, "learning_rate": 4.999424091250094e-06, "loss": 1.1631, "step": 1216 }, { "epoch": 0.04, "learning_rate": 4.999418844020377e-06, "loss": 1.0941, "step": 1217 }, { "epoch": 0.04, "learning_rate": 4.999413572997397e-06, "loss": 1.1931, "step": 1218 }, { "epoch": 0.04, "learning_rate": 4.999408278181204e-06, "loss": 1.1434, "step": 1219 }, { "epoch": 0.04, "learning_rate": 4.9994029595718465e-06, "loss": 1.1359, "step": 1220 }, { "epoch": 0.04, "learning_rate": 4.999397617169378e-06, "loss": 1.1174, "step": 1221 }, { "epoch": 0.04, "learning_rate": 4.999392250973847e-06, "loss": 1.2052, "step": 1222 }, { "epoch": 0.04, "learning_rate": 4.999386860985306e-06, "loss": 1.0711, "step": 1223 }, { "epoch": 0.04, "learning_rate": 4.999381447203805e-06, "loss": 1.2848, "step": 1224 }, { "epoch": 0.04, "learning_rate": 4.999376009629398e-06, "loss": 1.1804, "step": 1225 }, { "epoch": 0.04, "learning_rate": 4.999370548262133e-06, "loss": 1.1987, "step": 1226 }, { "epoch": 0.04, "learning_rate": 4.999365063102065e-06, "loss": 1.2681, "step": 1227 }, { "epoch": 0.04, "learning_rate": 4.999359554149246e-06, "loss": 1.2072, "step": 1228 }, { "epoch": 0.04, "learning_rate": 4.999354021403727e-06, "loss": 1.1793, "step": 1229 }, { "epoch": 0.04, "learning_rate": 4.999348464865562e-06, "loss": 1.1714, "step": 1230 }, { "epoch": 0.04, "learning_rate": 4.999342884534804e-06, "loss": 1.2401, "step": 1231 }, { "epoch": 0.04, "learning_rate": 4.999337280411503e-06, "loss": 1.2133, "step": 1232 }, { "epoch": 0.04, "learning_rate": 4.999331652495717e-06, "loss": 1.1494, "step": 1233 }, { "epoch": 0.04, "learning_rate": 4.999326000787497e-06, "loss": 1.1611, "step": 1234 }, { "epoch": 0.04, "learning_rate": 4.999320325286897e-06, "loss": 1.1602, "step": 1235 }, { "epoch": 0.04, "learning_rate": 4.999314625993971e-06, "loss": 1.2863, "step": 1236 }, { "epoch": 0.04, "learning_rate": 4.999308902908774e-06, "loss": 1.1766, "step": 1237 }, { "epoch": 0.04, "learning_rate": 4.9993031560313594e-06, "loss": 1.103, "step": 1238 }, { "epoch": 0.04, "learning_rate": 4.999297385361783e-06, "loss": 1.2174, "step": 1239 }, { "epoch": 0.04, "learning_rate": 4.999291590900099e-06, "loss": 1.2678, "step": 1240 }, { "epoch": 0.04, "learning_rate": 4.9992857726463626e-06, "loss": 1.1274, "step": 1241 }, { "epoch": 0.04, "learning_rate": 4.999279930600629e-06, "loss": 1.1638, "step": 1242 }, { "epoch": 0.04, "learning_rate": 4.999274064762954e-06, "loss": 1.1029, "step": 1243 }, { "epoch": 0.04, "learning_rate": 4.999268175133395e-06, "loss": 1.1553, "step": 1244 }, { "epoch": 0.04, "learning_rate": 4.999262261712006e-06, "loss": 1.0764, "step": 1245 }, { "epoch": 0.04, "learning_rate": 4.999256324498843e-06, "loss": 1.173, "step": 1246 }, { "epoch": 0.04, "learning_rate": 4.999250363493964e-06, "loss": 0.9943, "step": 1247 }, { "epoch": 0.04, "learning_rate": 4.999244378697425e-06, "loss": 1.2067, "step": 1248 }, { "epoch": 0.04, "learning_rate": 4.999238370109284e-06, "loss": 1.2059, "step": 1249 }, { "epoch": 0.04, "learning_rate": 4.999232337729597e-06, "loss": 1.1521, "step": 1250 }, { "epoch": 0.04, "learning_rate": 4.999226281558423e-06, "loss": 1.1582, "step": 1251 }, { "epoch": 0.04, "learning_rate": 4.999220201595816e-06, "loss": 1.1216, "step": 1252 }, { "epoch": 0.04, "learning_rate": 4.999214097841838e-06, "loss": 1.2056, "step": 1253 }, { "epoch": 0.04, "learning_rate": 4.999207970296545e-06, "loss": 1.1163, "step": 1254 }, { "epoch": 0.04, "learning_rate": 4.999201818959996e-06, "loss": 1.2896, "step": 1255 }, { "epoch": 0.04, "learning_rate": 4.99919564383225e-06, "loss": 1.2651, "step": 1256 }, { "epoch": 0.04, "learning_rate": 4.999189444913364e-06, "loss": 1.1967, "step": 1257 }, { "epoch": 0.04, "learning_rate": 4.999183222203398e-06, "loss": 1.1393, "step": 1258 }, { "epoch": 0.04, "learning_rate": 4.999176975702413e-06, "loss": 1.171, "step": 1259 }, { "epoch": 0.04, "learning_rate": 4.999170705410464e-06, "loss": 1.1812, "step": 1260 }, { "epoch": 0.04, "learning_rate": 4.999164411327616e-06, "loss": 1.1964, "step": 1261 }, { "epoch": 0.04, "learning_rate": 4.999158093453925e-06, "loss": 1.043, "step": 1262 }, { "epoch": 0.04, "learning_rate": 4.999151751789454e-06, "loss": 1.1852, "step": 1263 }, { "epoch": 0.04, "learning_rate": 4.999145386334261e-06, "loss": 1.2063, "step": 1264 }, { "epoch": 0.04, "learning_rate": 4.999138997088407e-06, "loss": 1.202, "step": 1265 }, { "epoch": 0.04, "learning_rate": 4.999132584051954e-06, "loss": 1.1888, "step": 1266 }, { "epoch": 0.04, "learning_rate": 4.999126147224963e-06, "loss": 1.19, "step": 1267 }, { "epoch": 0.04, "learning_rate": 4.999119686607494e-06, "loss": 1.2333, "step": 1268 }, { "epoch": 0.04, "learning_rate": 4.9991132021996105e-06, "loss": 1.1625, "step": 1269 }, { "epoch": 0.04, "learning_rate": 4.999106694001371e-06, "loss": 1.2666, "step": 1270 }, { "epoch": 0.04, "learning_rate": 4.999100162012841e-06, "loss": 1.1904, "step": 1271 }, { "epoch": 0.04, "learning_rate": 4.99909360623408e-06, "loss": 1.2199, "step": 1272 }, { "epoch": 0.04, "learning_rate": 4.9990870266651515e-06, "loss": 1.182, "step": 1273 }, { "epoch": 0.04, "learning_rate": 4.9990804233061185e-06, "loss": 1.2786, "step": 1274 }, { "epoch": 0.04, "learning_rate": 4.999073796157044e-06, "loss": 1.2375, "step": 1275 }, { "epoch": 0.04, "learning_rate": 4.99906714521799e-06, "loss": 1.1514, "step": 1276 }, { "epoch": 0.04, "learning_rate": 4.99906047048902e-06, "loss": 1.1731, "step": 1277 }, { "epoch": 0.04, "learning_rate": 4.9990537719701986e-06, "loss": 1.1437, "step": 1278 }, { "epoch": 0.04, "learning_rate": 4.999047049661588e-06, "loss": 1.1893, "step": 1279 }, { "epoch": 0.04, "learning_rate": 4.999040303563253e-06, "loss": 1.27, "step": 1280 }, { "epoch": 0.04, "learning_rate": 4.999033533675258e-06, "loss": 1.0272, "step": 1281 }, { "epoch": 0.04, "learning_rate": 4.999026739997668e-06, "loss": 1.0569, "step": 1282 }, { "epoch": 0.04, "learning_rate": 4.999019922530547e-06, "loss": 1.1085, "step": 1283 }, { "epoch": 0.04, "learning_rate": 4.99901308127396e-06, "loss": 1.2321, "step": 1284 }, { "epoch": 0.04, "learning_rate": 4.999006216227972e-06, "loss": 1.1481, "step": 1285 }, { "epoch": 0.04, "learning_rate": 4.998999327392648e-06, "loss": 1.2579, "step": 1286 }, { "epoch": 0.04, "learning_rate": 4.998992414768054e-06, "loss": 1.1197, "step": 1287 }, { "epoch": 0.04, "learning_rate": 4.998985478354255e-06, "loss": 1.1748, "step": 1288 }, { "epoch": 0.04, "learning_rate": 4.998978518151319e-06, "loss": 1.3066, "step": 1289 }, { "epoch": 0.04, "learning_rate": 4.998971534159311e-06, "loss": 1.1998, "step": 1290 }, { "epoch": 0.04, "learning_rate": 4.998964526378297e-06, "loss": 1.1135, "step": 1291 }, { "epoch": 0.04, "learning_rate": 4.998957494808345e-06, "loss": 1.0623, "step": 1292 }, { "epoch": 0.04, "learning_rate": 4.998950439449521e-06, "loss": 1.228, "step": 1293 }, { "epoch": 0.04, "learning_rate": 4.998943360301891e-06, "loss": 1.1464, "step": 1294 }, { "epoch": 0.04, "learning_rate": 4.9989362573655255e-06, "loss": 1.3088, "step": 1295 }, { "epoch": 0.04, "learning_rate": 4.998929130640489e-06, "loss": 1.1648, "step": 1296 }, { "epoch": 0.04, "learning_rate": 4.998921980126852e-06, "loss": 1.2195, "step": 1297 }, { "epoch": 0.04, "learning_rate": 4.99891480582468e-06, "loss": 1.3085, "step": 1298 }, { "epoch": 0.04, "learning_rate": 4.998907607734044e-06, "loss": 1.2379, "step": 1299 }, { "epoch": 0.04, "learning_rate": 4.998900385855009e-06, "loss": 1.1582, "step": 1300 }, { "epoch": 0.04, "learning_rate": 4.998893140187647e-06, "loss": 1.1902, "step": 1301 }, { "epoch": 0.04, "learning_rate": 4.9988858707320265e-06, "loss": 1.1809, "step": 1302 }, { "epoch": 0.04, "learning_rate": 4.998878577488216e-06, "loss": 1.0931, "step": 1303 }, { "epoch": 0.04, "learning_rate": 4.998871260456284e-06, "loss": 1.2208, "step": 1304 }, { "epoch": 0.04, "learning_rate": 4.998863919636301e-06, "loss": 1.1002, "step": 1305 }, { "epoch": 0.04, "learning_rate": 4.998856555028337e-06, "loss": 1.2803, "step": 1306 }, { "epoch": 0.04, "learning_rate": 4.9988491666324636e-06, "loss": 1.1996, "step": 1307 }, { "epoch": 0.04, "learning_rate": 4.998841754448749e-06, "loss": 1.2308, "step": 1308 }, { "epoch": 0.04, "learning_rate": 4.998834318477263e-06, "loss": 1.1825, "step": 1309 }, { "epoch": 0.04, "learning_rate": 4.998826858718079e-06, "loss": 1.2411, "step": 1310 }, { "epoch": 0.04, "learning_rate": 4.998819375171267e-06, "loss": 1.1585, "step": 1311 }, { "epoch": 0.04, "learning_rate": 4.998811867836897e-06, "loss": 1.2182, "step": 1312 }, { "epoch": 0.04, "learning_rate": 4.9988043367150415e-06, "loss": 1.2373, "step": 1313 }, { "epoch": 0.04, "learning_rate": 4.9987967818057735e-06, "loss": 1.1693, "step": 1314 }, { "epoch": 0.04, "learning_rate": 4.9987892031091624e-06, "loss": 1.1127, "step": 1315 }, { "epoch": 0.04, "learning_rate": 4.998781600625282e-06, "loss": 1.2482, "step": 1316 }, { "epoch": 0.04, "learning_rate": 4.998773974354204e-06, "loss": 1.1218, "step": 1317 }, { "epoch": 0.04, "learning_rate": 4.998766324296001e-06, "loss": 1.3101, "step": 1318 }, { "epoch": 0.04, "learning_rate": 4.998758650450747e-06, "loss": 1.2413, "step": 1319 }, { "epoch": 0.04, "learning_rate": 4.998750952818513e-06, "loss": 1.0904, "step": 1320 }, { "epoch": 0.04, "learning_rate": 4.998743231399374e-06, "loss": 1.1758, "step": 1321 }, { "epoch": 0.04, "learning_rate": 4.9987354861934025e-06, "loss": 1.1472, "step": 1322 }, { "epoch": 0.04, "learning_rate": 4.998727717200673e-06, "loss": 1.1378, "step": 1323 }, { "epoch": 0.04, "learning_rate": 4.998719924421259e-06, "loss": 1.3068, "step": 1324 }, { "epoch": 0.04, "learning_rate": 4.998712107855235e-06, "loss": 1.183, "step": 1325 }, { "epoch": 0.04, "learning_rate": 4.998704267502674e-06, "loss": 1.3583, "step": 1326 }, { "epoch": 0.04, "learning_rate": 4.998696403363653e-06, "loss": 1.1131, "step": 1327 }, { "epoch": 0.04, "learning_rate": 4.998688515438245e-06, "loss": 1.1979, "step": 1328 }, { "epoch": 0.04, "learning_rate": 4.998680603726526e-06, "loss": 1.1226, "step": 1329 }, { "epoch": 0.04, "learning_rate": 4.9986726682285715e-06, "loss": 1.1897, "step": 1330 }, { "epoch": 0.04, "learning_rate": 4.998664708944456e-06, "loss": 1.2422, "step": 1331 }, { "epoch": 0.04, "learning_rate": 4.9986567258742555e-06, "loss": 1.1536, "step": 1332 }, { "epoch": 0.04, "learning_rate": 4.998648719018047e-06, "loss": 1.2736, "step": 1333 }, { "epoch": 0.04, "learning_rate": 4.998640688375906e-06, "loss": 1.1761, "step": 1334 }, { "epoch": 0.04, "learning_rate": 4.998632633947909e-06, "loss": 1.1676, "step": 1335 }, { "epoch": 0.04, "learning_rate": 4.998624555734133e-06, "loss": 1.1616, "step": 1336 }, { "epoch": 0.04, "learning_rate": 4.998616453734654e-06, "loss": 1.2911, "step": 1337 }, { "epoch": 0.04, "learning_rate": 4.99860832794955e-06, "loss": 1.298, "step": 1338 }, { "epoch": 0.04, "learning_rate": 4.9986001783788985e-06, "loss": 1.3102, "step": 1339 }, { "epoch": 0.04, "learning_rate": 4.998592005022776e-06, "loss": 1.1874, "step": 1340 }, { "epoch": 0.04, "learning_rate": 4.998583807881261e-06, "loss": 1.0962, "step": 1341 }, { "epoch": 0.04, "learning_rate": 4.998575586954432e-06, "loss": 1.1724, "step": 1342 }, { "epoch": 0.04, "learning_rate": 4.998567342242366e-06, "loss": 1.1174, "step": 1343 }, { "epoch": 0.04, "learning_rate": 4.9985590737451425e-06, "loss": 1.2355, "step": 1344 }, { "epoch": 0.04, "learning_rate": 4.998550781462841e-06, "loss": 1.1818, "step": 1345 }, { "epoch": 0.04, "learning_rate": 4.998542465395538e-06, "loss": 1.1931, "step": 1346 }, { "epoch": 0.04, "learning_rate": 4.998534125543315e-06, "loss": 1.1846, "step": 1347 }, { "epoch": 0.04, "learning_rate": 4.99852576190625e-06, "loss": 1.1802, "step": 1348 }, { "epoch": 0.04, "learning_rate": 4.998517374484424e-06, "loss": 1.2102, "step": 1349 }, { "epoch": 0.04, "learning_rate": 4.998508963277915e-06, "loss": 1.3833, "step": 1350 }, { "epoch": 0.04, "learning_rate": 4.998500528286804e-06, "loss": 1.1958, "step": 1351 }, { "epoch": 0.04, "learning_rate": 4.998492069511171e-06, "loss": 1.2758, "step": 1352 }, { "epoch": 0.04, "learning_rate": 4.998483586951098e-06, "loss": 1.1449, "step": 1353 }, { "epoch": 0.04, "learning_rate": 4.998475080606664e-06, "loss": 1.0632, "step": 1354 }, { "epoch": 0.04, "learning_rate": 4.99846655047795e-06, "loss": 1.209, "step": 1355 }, { "epoch": 0.04, "learning_rate": 4.998457996565038e-06, "loss": 1.1489, "step": 1356 }, { "epoch": 0.04, "learning_rate": 4.99844941886801e-06, "loss": 1.217, "step": 1357 }, { "epoch": 0.04, "learning_rate": 4.998440817386946e-06, "loss": 1.2353, "step": 1358 }, { "epoch": 0.04, "learning_rate": 4.998432192121929e-06, "loss": 1.1604, "step": 1359 }, { "epoch": 0.04, "learning_rate": 4.9984235430730395e-06, "loss": 1.1613, "step": 1360 }, { "epoch": 0.04, "learning_rate": 4.998414870240364e-06, "loss": 1.1868, "step": 1361 }, { "epoch": 0.04, "learning_rate": 4.99840617362398e-06, "loss": 1.2488, "step": 1362 }, { "epoch": 0.04, "learning_rate": 4.998397453223973e-06, "loss": 1.1479, "step": 1363 }, { "epoch": 0.04, "learning_rate": 4.9983887090404245e-06, "loss": 1.1649, "step": 1364 }, { "epoch": 0.04, "learning_rate": 4.99837994107342e-06, "loss": 1.1569, "step": 1365 }, { "epoch": 0.04, "learning_rate": 4.998371149323042e-06, "loss": 1.0776, "step": 1366 }, { "epoch": 0.04, "learning_rate": 4.998362333789374e-06, "loss": 1.2302, "step": 1367 }, { "epoch": 0.04, "learning_rate": 4.998353494472499e-06, "loss": 1.2625, "step": 1368 }, { "epoch": 0.04, "learning_rate": 4.998344631372501e-06, "loss": 1.0291, "step": 1369 }, { "epoch": 0.04, "learning_rate": 4.9983357444894674e-06, "loss": 1.2343, "step": 1370 }, { "epoch": 0.04, "learning_rate": 4.998326833823481e-06, "loss": 1.0707, "step": 1371 }, { "epoch": 0.04, "learning_rate": 4.998317899374624e-06, "loss": 1.2134, "step": 1372 }, { "epoch": 0.04, "learning_rate": 4.998308941142985e-06, "loss": 1.222, "step": 1373 }, { "epoch": 0.04, "learning_rate": 4.998299959128649e-06, "loss": 1.1685, "step": 1374 }, { "epoch": 0.04, "learning_rate": 4.9982909533316996e-06, "loss": 1.2791, "step": 1375 }, { "epoch": 0.04, "learning_rate": 4.998281923752224e-06, "loss": 1.1735, "step": 1376 }, { "epoch": 0.04, "learning_rate": 4.998272870390307e-06, "loss": 1.1858, "step": 1377 }, { "epoch": 0.04, "learning_rate": 4.998263793246036e-06, "loss": 1.1583, "step": 1378 }, { "epoch": 0.04, "learning_rate": 4.998254692319497e-06, "loss": 1.1561, "step": 1379 }, { "epoch": 0.04, "learning_rate": 4.9982455676107765e-06, "loss": 1.2388, "step": 1380 }, { "epoch": 0.04, "learning_rate": 4.998236419119962e-06, "loss": 1.1078, "step": 1381 }, { "epoch": 0.04, "learning_rate": 4.998227246847139e-06, "loss": 1.1591, "step": 1382 }, { "epoch": 0.04, "learning_rate": 4.998218050792396e-06, "loss": 1.2454, "step": 1383 }, { "epoch": 0.04, "learning_rate": 4.99820883095582e-06, "loss": 1.1569, "step": 1384 }, { "epoch": 0.04, "learning_rate": 4.9981995873375e-06, "loss": 1.175, "step": 1385 }, { "epoch": 0.04, "learning_rate": 4.998190319937522e-06, "loss": 1.2799, "step": 1386 }, { "epoch": 0.04, "learning_rate": 4.998181028755976e-06, "loss": 1.1968, "step": 1387 }, { "epoch": 0.04, "learning_rate": 4.99817171379295e-06, "loss": 1.2042, "step": 1388 }, { "epoch": 0.04, "learning_rate": 4.998162375048532e-06, "loss": 1.1487, "step": 1389 }, { "epoch": 0.04, "learning_rate": 4.998153012522812e-06, "loss": 1.157, "step": 1390 }, { "epoch": 0.04, "learning_rate": 4.9981436262158775e-06, "loss": 1.1346, "step": 1391 }, { "epoch": 0.04, "learning_rate": 4.99813421612782e-06, "loss": 1.2218, "step": 1392 }, { "epoch": 0.04, "learning_rate": 4.998124782258727e-06, "loss": 1.2579, "step": 1393 }, { "epoch": 0.04, "learning_rate": 4.9981153246086895e-06, "loss": 1.191, "step": 1394 }, { "epoch": 0.04, "learning_rate": 4.998105843177797e-06, "loss": 1.1713, "step": 1395 }, { "epoch": 0.04, "learning_rate": 4.99809633796614e-06, "loss": 1.1553, "step": 1396 }, { "epoch": 0.04, "learning_rate": 4.998086808973809e-06, "loss": 1.0659, "step": 1397 }, { "epoch": 0.04, "learning_rate": 4.998077256200895e-06, "loss": 1.2234, "step": 1398 }, { "epoch": 0.04, "learning_rate": 4.99806767964749e-06, "loss": 1.2722, "step": 1399 }, { "epoch": 0.04, "learning_rate": 4.998058079313681e-06, "loss": 1.185, "step": 1400 }, { "epoch": 0.04, "learning_rate": 4.998048455199563e-06, "loss": 1.2054, "step": 1401 }, { "epoch": 0.04, "learning_rate": 4.998038807305228e-06, "loss": 1.1964, "step": 1402 }, { "epoch": 0.04, "learning_rate": 4.998029135630766e-06, "loss": 1.0212, "step": 1403 }, { "epoch": 0.04, "learning_rate": 4.99801944017627e-06, "loss": 1.2871, "step": 1404 }, { "epoch": 0.04, "learning_rate": 4.998009720941831e-06, "loss": 1.2743, "step": 1405 }, { "epoch": 0.04, "learning_rate": 4.997999977927543e-06, "loss": 1.2203, "step": 1406 }, { "epoch": 0.04, "learning_rate": 4.997990211133499e-06, "loss": 1.1323, "step": 1407 }, { "epoch": 0.04, "learning_rate": 4.997980420559791e-06, "loss": 1.2367, "step": 1408 }, { "epoch": 0.04, "learning_rate": 4.997970606206512e-06, "loss": 1.142, "step": 1409 }, { "epoch": 0.04, "learning_rate": 4.9979607680737565e-06, "loss": 1.2618, "step": 1410 }, { "epoch": 0.04, "learning_rate": 4.997950906161617e-06, "loss": 1.1359, "step": 1411 }, { "epoch": 0.04, "learning_rate": 4.997941020470188e-06, "loss": 1.3521, "step": 1412 }, { "epoch": 0.04, "learning_rate": 4.997931110999564e-06, "loss": 1.3456, "step": 1413 }, { "epoch": 0.04, "learning_rate": 4.9979211777498386e-06, "loss": 1.1636, "step": 1414 }, { "epoch": 0.04, "learning_rate": 4.997911220721107e-06, "loss": 1.1298, "step": 1415 }, { "epoch": 0.04, "learning_rate": 4.997901239913462e-06, "loss": 1.145, "step": 1416 }, { "epoch": 0.04, "learning_rate": 4.997891235327002e-06, "loss": 1.1483, "step": 1417 }, { "epoch": 0.04, "learning_rate": 4.99788120696182e-06, "loss": 1.1073, "step": 1418 }, { "epoch": 0.04, "learning_rate": 4.997871154818011e-06, "loss": 1.2251, "step": 1419 }, { "epoch": 0.04, "learning_rate": 4.997861078895673e-06, "loss": 1.2023, "step": 1420 }, { "epoch": 0.04, "learning_rate": 4.9978509791949e-06, "loss": 1.1567, "step": 1421 }, { "epoch": 0.04, "learning_rate": 4.997840855715789e-06, "loss": 1.0558, "step": 1422 }, { "epoch": 0.04, "learning_rate": 4.997830708458435e-06, "loss": 1.1428, "step": 1423 }, { "epoch": 0.04, "learning_rate": 4.997820537422936e-06, "loss": 1.2295, "step": 1424 }, { "epoch": 0.04, "learning_rate": 4.99781034260939e-06, "loss": 1.2659, "step": 1425 }, { "epoch": 0.04, "learning_rate": 4.997800124017891e-06, "loss": 1.3099, "step": 1426 }, { "epoch": 0.04, "learning_rate": 4.997789881648538e-06, "loss": 1.0925, "step": 1427 }, { "epoch": 0.04, "learning_rate": 4.997779615501428e-06, "loss": 1.1285, "step": 1428 }, { "epoch": 0.04, "learning_rate": 4.99776932557666e-06, "loss": 1.111, "step": 1429 }, { "epoch": 0.04, "learning_rate": 4.997759011874331e-06, "loss": 1.2139, "step": 1430 }, { "epoch": 0.04, "learning_rate": 4.997748674394538e-06, "loss": 1.2056, "step": 1431 }, { "epoch": 0.04, "learning_rate": 4.997738313137381e-06, "loss": 1.2531, "step": 1432 }, { "epoch": 0.04, "learning_rate": 4.997727928102959e-06, "loss": 1.1431, "step": 1433 }, { "epoch": 0.04, "learning_rate": 4.997717519291369e-06, "loss": 1.1631, "step": 1434 }, { "epoch": 0.04, "learning_rate": 4.997707086702711e-06, "loss": 1.1643, "step": 1435 }, { "epoch": 0.04, "learning_rate": 4.9976966303370855e-06, "loss": 1.1473, "step": 1436 }, { "epoch": 0.04, "learning_rate": 4.997686150194591e-06, "loss": 1.0486, "step": 1437 }, { "epoch": 0.04, "learning_rate": 4.997675646275328e-06, "loss": 1.1455, "step": 1438 }, { "epoch": 0.04, "learning_rate": 4.997665118579394e-06, "loss": 1.1986, "step": 1439 }, { "epoch": 0.04, "learning_rate": 4.997654567106891e-06, "loss": 1.1876, "step": 1440 }, { "epoch": 0.04, "learning_rate": 4.99764399185792e-06, "loss": 1.0878, "step": 1441 }, { "epoch": 0.04, "learning_rate": 4.997633392832582e-06, "loss": 1.2119, "step": 1442 }, { "epoch": 0.04, "learning_rate": 4.997622770030976e-06, "loss": 1.2625, "step": 1443 }, { "epoch": 0.04, "learning_rate": 4.9976121234532035e-06, "loss": 1.2322, "step": 1444 }, { "epoch": 0.04, "learning_rate": 4.9976014530993674e-06, "loss": 1.2446, "step": 1445 }, { "epoch": 0.04, "learning_rate": 4.997590758969569e-06, "loss": 1.1074, "step": 1446 }, { "epoch": 0.04, "learning_rate": 4.997580041063909e-06, "loss": 1.0842, "step": 1447 }, { "epoch": 0.04, "learning_rate": 4.9975692993824895e-06, "loss": 1.1553, "step": 1448 }, { "epoch": 0.04, "learning_rate": 4.997558533925413e-06, "loss": 1.2311, "step": 1449 }, { "epoch": 0.04, "learning_rate": 4.997547744692782e-06, "loss": 1.1765, "step": 1450 }, { "epoch": 0.04, "learning_rate": 4.9975369316847e-06, "loss": 1.261, "step": 1451 }, { "epoch": 0.04, "learning_rate": 4.9975260949012685e-06, "loss": 1.0226, "step": 1452 }, { "epoch": 0.04, "learning_rate": 4.997515234342593e-06, "loss": 1.1461, "step": 1453 }, { "epoch": 0.04, "learning_rate": 4.9975043500087735e-06, "loss": 1.1948, "step": 1454 }, { "epoch": 0.04, "learning_rate": 4.997493441899917e-06, "loss": 1.2085, "step": 1455 }, { "epoch": 0.04, "learning_rate": 4.9974825100161236e-06, "loss": 1.0927, "step": 1456 }, { "epoch": 0.04, "learning_rate": 4.997471554357501e-06, "loss": 1.1628, "step": 1457 }, { "epoch": 0.04, "learning_rate": 4.997460574924152e-06, "loss": 1.1052, "step": 1458 }, { "epoch": 0.04, "learning_rate": 4.997449571716181e-06, "loss": 1.046, "step": 1459 }, { "epoch": 0.04, "learning_rate": 4.997438544733693e-06, "loss": 1.092, "step": 1460 }, { "epoch": 0.04, "learning_rate": 4.997427493976793e-06, "loss": 1.2162, "step": 1461 }, { "epoch": 0.04, "learning_rate": 4.997416419445585e-06, "loss": 1.1691, "step": 1462 }, { "epoch": 0.04, "learning_rate": 4.997405321140177e-06, "loss": 1.29, "step": 1463 }, { "epoch": 0.04, "learning_rate": 4.9973941990606726e-06, "loss": 1.1586, "step": 1464 }, { "epoch": 0.04, "learning_rate": 4.9973830532071775e-06, "loss": 1.1602, "step": 1465 }, { "epoch": 0.04, "learning_rate": 4.997371883579799e-06, "loss": 1.2015, "step": 1466 }, { "epoch": 0.04, "learning_rate": 4.997360690178643e-06, "loss": 1.1411, "step": 1467 }, { "epoch": 0.04, "learning_rate": 4.9973494730038165e-06, "loss": 1.2632, "step": 1468 }, { "epoch": 0.04, "learning_rate": 4.997338232055425e-06, "loss": 1.2042, "step": 1469 }, { "epoch": 0.04, "learning_rate": 4.9973269673335765e-06, "loss": 1.2416, "step": 1470 }, { "epoch": 0.04, "learning_rate": 4.997315678838378e-06, "loss": 1.2423, "step": 1471 }, { "epoch": 0.04, "learning_rate": 4.9973043665699375e-06, "loss": 1.2742, "step": 1472 }, { "epoch": 0.04, "learning_rate": 4.997293030528362e-06, "loss": 1.1768, "step": 1473 }, { "epoch": 0.04, "learning_rate": 4.997281670713759e-06, "loss": 1.2313, "step": 1474 }, { "epoch": 0.04, "learning_rate": 4.997270287126238e-06, "loss": 1.3273, "step": 1475 }, { "epoch": 0.04, "learning_rate": 4.997258879765906e-06, "loss": 1.0893, "step": 1476 }, { "epoch": 0.04, "learning_rate": 4.997247448632873e-06, "loss": 1.1846, "step": 1477 }, { "epoch": 0.04, "learning_rate": 4.997235993727245e-06, "loss": 1.1807, "step": 1478 }, { "epoch": 0.04, "learning_rate": 4.997224515049135e-06, "loss": 1.1299, "step": 1479 }, { "epoch": 0.04, "learning_rate": 4.997213012598649e-06, "loss": 1.1835, "step": 1480 }, { "epoch": 0.04, "learning_rate": 4.997201486375899e-06, "loss": 1.2907, "step": 1481 }, { "epoch": 0.04, "learning_rate": 4.997189936380993e-06, "loss": 1.1105, "step": 1482 }, { "epoch": 0.04, "learning_rate": 4.9971783626140416e-06, "loss": 1.2328, "step": 1483 }, { "epoch": 0.04, "learning_rate": 4.997166765075155e-06, "loss": 1.1407, "step": 1484 }, { "epoch": 0.04, "learning_rate": 4.997155143764444e-06, "loss": 1.0615, "step": 1485 }, { "epoch": 0.04, "learning_rate": 4.997143498682017e-06, "loss": 1.2443, "step": 1486 }, { "epoch": 0.04, "learning_rate": 4.997131829827988e-06, "loss": 1.2174, "step": 1487 }, { "epoch": 0.04, "learning_rate": 4.997120137202466e-06, "loss": 1.1293, "step": 1488 }, { "epoch": 0.04, "learning_rate": 4.9971084208055635e-06, "loss": 1.2218, "step": 1489 }, { "epoch": 0.04, "learning_rate": 4.997096680637391e-06, "loss": 1.1495, "step": 1490 }, { "epoch": 0.04, "learning_rate": 4.997084916698061e-06, "loss": 1.1042, "step": 1491 }, { "epoch": 0.04, "learning_rate": 4.997073128987685e-06, "loss": 1.2842, "step": 1492 }, { "epoch": 0.04, "learning_rate": 4.997061317506376e-06, "loss": 1.1063, "step": 1493 }, { "epoch": 0.05, "learning_rate": 4.997049482254246e-06, "loss": 1.1703, "step": 1494 }, { "epoch": 0.05, "learning_rate": 4.997037623231406e-06, "loss": 1.0982, "step": 1495 }, { "epoch": 0.05, "learning_rate": 4.9970257404379715e-06, "loss": 1.2062, "step": 1496 }, { "epoch": 0.05, "learning_rate": 4.9970138338740544e-06, "loss": 1.1735, "step": 1497 }, { "epoch": 0.05, "learning_rate": 4.997001903539769e-06, "loss": 1.1236, "step": 1498 }, { "epoch": 0.05, "learning_rate": 4.996989949435227e-06, "loss": 1.2139, "step": 1499 }, { "epoch": 0.05, "learning_rate": 4.996977971560544e-06, "loss": 1.0888, "step": 1500 }, { "epoch": 0.05, "learning_rate": 4.996965969915833e-06, "loss": 1.1982, "step": 1501 }, { "epoch": 0.05, "learning_rate": 4.9969539445012084e-06, "loss": 1.2223, "step": 1502 }, { "epoch": 0.05, "learning_rate": 4.996941895316785e-06, "loss": 1.0839, "step": 1503 }, { "epoch": 0.05, "learning_rate": 4.996929822362677e-06, "loss": 1.1498, "step": 1504 }, { "epoch": 0.05, "learning_rate": 4.996917725639e-06, "loss": 1.1985, "step": 1505 }, { "epoch": 0.05, "learning_rate": 4.996905605145869e-06, "loss": 1.1567, "step": 1506 }, { "epoch": 0.05, "learning_rate": 4.9968934608833986e-06, "loss": 1.1472, "step": 1507 }, { "epoch": 0.05, "learning_rate": 4.996881292851705e-06, "loss": 1.1729, "step": 1508 }, { "epoch": 0.05, "learning_rate": 4.996869101050905e-06, "loss": 1.1501, "step": 1509 }, { "epoch": 0.05, "learning_rate": 4.996856885481113e-06, "loss": 1.0624, "step": 1510 }, { "epoch": 0.05, "learning_rate": 4.996844646142446e-06, "loss": 1.1618, "step": 1511 }, { "epoch": 0.05, "learning_rate": 4.99683238303502e-06, "loss": 1.2357, "step": 1512 }, { "epoch": 0.05, "learning_rate": 4.996820096158953e-06, "loss": 1.1534, "step": 1513 }, { "epoch": 0.05, "learning_rate": 4.996807785514361e-06, "loss": 1.2262, "step": 1514 }, { "epoch": 0.05, "learning_rate": 4.996795451101361e-06, "loss": 1.191, "step": 1515 }, { "epoch": 0.05, "learning_rate": 4.996783092920071e-06, "loss": 1.2784, "step": 1516 }, { "epoch": 0.05, "learning_rate": 4.996770710970609e-06, "loss": 1.18, "step": 1517 }, { "epoch": 0.05, "learning_rate": 4.996758305253092e-06, "loss": 1.1997, "step": 1518 }, { "epoch": 0.05, "learning_rate": 4.996745875767638e-06, "loss": 1.1383, "step": 1519 }, { "epoch": 0.05, "learning_rate": 4.996733422514366e-06, "loss": 1.2999, "step": 1520 }, { "epoch": 0.05, "learning_rate": 4.996720945493394e-06, "loss": 1.1683, "step": 1521 }, { "epoch": 0.05, "learning_rate": 4.996708444704842e-06, "loss": 1.1771, "step": 1522 }, { "epoch": 0.05, "learning_rate": 4.9966959201488275e-06, "loss": 1.2676, "step": 1523 }, { "epoch": 0.05, "learning_rate": 4.99668337182547e-06, "loss": 1.1324, "step": 1524 }, { "epoch": 0.05, "learning_rate": 4.99667079973489e-06, "loss": 1.2147, "step": 1525 }, { "epoch": 0.05, "learning_rate": 4.996658203877205e-06, "loss": 1.2349, "step": 1526 }, { "epoch": 0.05, "learning_rate": 4.996645584252538e-06, "loss": 1.224, "step": 1527 }, { "epoch": 0.05, "learning_rate": 4.996632940861006e-06, "loss": 1.2042, "step": 1528 }, { "epoch": 0.05, "learning_rate": 4.9966202737027315e-06, "loss": 1.3643, "step": 1529 }, { "epoch": 0.05, "learning_rate": 4.996607582777835e-06, "loss": 1.2596, "step": 1530 }, { "epoch": 0.05, "learning_rate": 4.996594868086436e-06, "loss": 1.2344, "step": 1531 }, { "epoch": 0.05, "learning_rate": 4.996582129628656e-06, "loss": 1.2437, "step": 1532 }, { "epoch": 0.05, "learning_rate": 4.996569367404617e-06, "loss": 1.1772, "step": 1533 }, { "epoch": 0.05, "learning_rate": 4.99655658141444e-06, "loss": 1.1131, "step": 1534 }, { "epoch": 0.05, "learning_rate": 4.996543771658246e-06, "loss": 1.1116, "step": 1535 }, { "epoch": 0.05, "learning_rate": 4.996530938136159e-06, "loss": 1.0788, "step": 1536 }, { "epoch": 0.05, "learning_rate": 4.996518080848299e-06, "loss": 1.2013, "step": 1537 }, { "epoch": 0.05, "learning_rate": 4.996505199794789e-06, "loss": 1.0881, "step": 1538 }, { "epoch": 0.05, "learning_rate": 4.996492294975753e-06, "loss": 1.1772, "step": 1539 }, { "epoch": 0.05, "learning_rate": 4.996479366391312e-06, "loss": 1.15, "step": 1540 }, { "epoch": 0.05, "learning_rate": 4.99646641404159e-06, "loss": 1.1144, "step": 1541 }, { "epoch": 0.05, "learning_rate": 4.996453437926709e-06, "loss": 1.1946, "step": 1542 }, { "epoch": 0.05, "learning_rate": 4.996440438046795e-06, "loss": 1.1885, "step": 1543 }, { "epoch": 0.05, "learning_rate": 4.9964274144019695e-06, "loss": 1.3342, "step": 1544 }, { "epoch": 0.05, "learning_rate": 4.9964143669923575e-06, "loss": 1.1249, "step": 1545 }, { "epoch": 0.05, "learning_rate": 4.996401295818083e-06, "loss": 1.1367, "step": 1546 }, { "epoch": 0.05, "learning_rate": 4.996388200879271e-06, "loss": 1.2043, "step": 1547 }, { "epoch": 0.05, "learning_rate": 4.996375082176045e-06, "loss": 1.2315, "step": 1548 }, { "epoch": 0.05, "learning_rate": 4.996361939708531e-06, "loss": 1.2769, "step": 1549 }, { "epoch": 0.05, "learning_rate": 4.996348773476854e-06, "loss": 1.1766, "step": 1550 }, { "epoch": 0.05, "learning_rate": 4.9963355834811375e-06, "loss": 1.1169, "step": 1551 }, { "epoch": 0.05, "learning_rate": 4.996322369721509e-06, "loss": 1.174, "step": 1552 }, { "epoch": 0.05, "learning_rate": 4.996309132198095e-06, "loss": 1.1461, "step": 1553 }, { "epoch": 0.05, "learning_rate": 4.996295870911019e-06, "loss": 1.354, "step": 1554 }, { "epoch": 0.05, "learning_rate": 4.996282585860409e-06, "loss": 1.1774, "step": 1555 }, { "epoch": 0.05, "learning_rate": 4.996269277046391e-06, "loss": 1.1967, "step": 1556 }, { "epoch": 0.05, "learning_rate": 4.996255944469092e-06, "loss": 1.2192, "step": 1557 }, { "epoch": 0.05, "learning_rate": 4.9962425881286385e-06, "loss": 1.1819, "step": 1558 }, { "epoch": 0.05, "learning_rate": 4.9962292080251575e-06, "loss": 1.1674, "step": 1559 }, { "epoch": 0.05, "learning_rate": 4.996215804158777e-06, "loss": 1.1873, "step": 1560 }, { "epoch": 0.05, "learning_rate": 4.996202376529625e-06, "loss": 1.3192, "step": 1561 }, { "epoch": 0.05, "learning_rate": 4.996188925137827e-06, "loss": 1.1459, "step": 1562 }, { "epoch": 0.05, "learning_rate": 4.9961754499835136e-06, "loss": 1.1735, "step": 1563 }, { "epoch": 0.05, "learning_rate": 4.9961619510668125e-06, "loss": 1.166, "step": 1564 }, { "epoch": 0.05, "learning_rate": 4.996148428387851e-06, "loss": 1.0241, "step": 1565 }, { "epoch": 0.05, "learning_rate": 4.996134881946759e-06, "loss": 1.2385, "step": 1566 }, { "epoch": 0.05, "learning_rate": 4.996121311743665e-06, "loss": 1.2433, "step": 1567 }, { "epoch": 0.05, "learning_rate": 4.996107717778698e-06, "loss": 1.1202, "step": 1568 }, { "epoch": 0.05, "learning_rate": 4.996094100051988e-06, "loss": 1.1934, "step": 1569 }, { "epoch": 0.05, "learning_rate": 4.996080458563664e-06, "loss": 1.1459, "step": 1570 }, { "epoch": 0.05, "learning_rate": 4.9960667933138575e-06, "loss": 1.0416, "step": 1571 }, { "epoch": 0.05, "learning_rate": 4.996053104302696e-06, "loss": 1.1928, "step": 1572 }, { "epoch": 0.05, "learning_rate": 4.996039391530312e-06, "loss": 1.1469, "step": 1573 }, { "epoch": 0.05, "learning_rate": 4.9960256549968335e-06, "loss": 1.1815, "step": 1574 }, { "epoch": 0.05, "learning_rate": 4.996011894702394e-06, "loss": 1.2447, "step": 1575 }, { "epoch": 0.05, "learning_rate": 4.995998110647123e-06, "loss": 1.1324, "step": 1576 }, { "epoch": 0.05, "learning_rate": 4.995984302831153e-06, "loss": 1.1459, "step": 1577 }, { "epoch": 0.05, "learning_rate": 4.995970471254613e-06, "loss": 1.1298, "step": 1578 }, { "epoch": 0.05, "learning_rate": 4.995956615917637e-06, "loss": 1.2235, "step": 1579 }, { "epoch": 0.05, "learning_rate": 4.995942736820357e-06, "loss": 1.1102, "step": 1580 }, { "epoch": 0.05, "learning_rate": 4.9959288339629034e-06, "loss": 1.1386, "step": 1581 }, { "epoch": 0.05, "learning_rate": 4.99591490734541e-06, "loss": 1.0818, "step": 1582 }, { "epoch": 0.05, "learning_rate": 4.9959009569680074e-06, "loss": 1.1465, "step": 1583 }, { "epoch": 0.05, "learning_rate": 4.995886982830831e-06, "loss": 1.1124, "step": 1584 }, { "epoch": 0.05, "learning_rate": 4.995872984934012e-06, "loss": 1.271, "step": 1585 }, { "epoch": 0.05, "learning_rate": 4.995858963277685e-06, "loss": 1.1163, "step": 1586 }, { "epoch": 0.05, "learning_rate": 4.995844917861981e-06, "loss": 1.1763, "step": 1587 }, { "epoch": 0.05, "learning_rate": 4.9958308486870375e-06, "loss": 1.2415, "step": 1588 }, { "epoch": 0.05, "learning_rate": 4.995816755752985e-06, "loss": 1.181, "step": 1589 }, { "epoch": 0.05, "learning_rate": 4.995802639059959e-06, "loss": 1.1247, "step": 1590 }, { "epoch": 0.05, "learning_rate": 4.995788498608094e-06, "loss": 1.1912, "step": 1591 }, { "epoch": 0.05, "learning_rate": 4.995774334397525e-06, "loss": 1.1967, "step": 1592 }, { "epoch": 0.05, "learning_rate": 4.995760146428387e-06, "loss": 1.1281, "step": 1593 }, { "epoch": 0.05, "learning_rate": 4.995745934700813e-06, "loss": 1.1555, "step": 1594 }, { "epoch": 0.05, "learning_rate": 4.995731699214941e-06, "loss": 1.1896, "step": 1595 }, { "epoch": 0.05, "learning_rate": 4.9957174399709045e-06, "loss": 1.192, "step": 1596 }, { "epoch": 0.05, "learning_rate": 4.995703156968839e-06, "loss": 1.051, "step": 1597 }, { "epoch": 0.05, "learning_rate": 4.995688850208882e-06, "loss": 1.2188, "step": 1598 }, { "epoch": 0.05, "learning_rate": 4.99567451969117e-06, "loss": 1.1842, "step": 1599 }, { "epoch": 0.05, "learning_rate": 4.995660165415838e-06, "loss": 1.1573, "step": 1600 }, { "epoch": 0.05, "learning_rate": 4.9956457873830235e-06, "loss": 1.239, "step": 1601 }, { "epoch": 0.05, "learning_rate": 4.995631385592862e-06, "loss": 1.1345, "step": 1602 }, { "epoch": 0.05, "learning_rate": 4.995616960045493e-06, "loss": 1.0983, "step": 1603 }, { "epoch": 0.05, "learning_rate": 4.995602510741051e-06, "loss": 1.2007, "step": 1604 }, { "epoch": 0.05, "learning_rate": 4.995588037679676e-06, "loss": 1.1747, "step": 1605 }, { "epoch": 0.05, "learning_rate": 4.995573540861505e-06, "loss": 1.1755, "step": 1606 }, { "epoch": 0.05, "learning_rate": 4.995559020286676e-06, "loss": 1.1733, "step": 1607 }, { "epoch": 0.05, "learning_rate": 4.995544475955326e-06, "loss": 1.1702, "step": 1608 }, { "epoch": 0.05, "learning_rate": 4.995529907867595e-06, "loss": 1.2209, "step": 1609 }, { "epoch": 0.05, "learning_rate": 4.99551531602362e-06, "loss": 1.278, "step": 1610 }, { "epoch": 0.05, "learning_rate": 4.995500700423543e-06, "loss": 1.1365, "step": 1611 }, { "epoch": 0.05, "learning_rate": 4.9954860610675e-06, "loss": 1.1733, "step": 1612 }, { "epoch": 0.05, "learning_rate": 4.995471397955632e-06, "loss": 1.0359, "step": 1613 }, { "epoch": 0.05, "learning_rate": 4.995456711088078e-06, "loss": 1.116, "step": 1614 }, { "epoch": 0.05, "learning_rate": 4.995442000464978e-06, "loss": 1.1791, "step": 1615 }, { "epoch": 0.05, "learning_rate": 4.995427266086472e-06, "loss": 1.1511, "step": 1616 }, { "epoch": 0.05, "learning_rate": 4.9954125079527005e-06, "loss": 1.2079, "step": 1617 }, { "epoch": 0.05, "learning_rate": 4.995397726063804e-06, "loss": 1.2311, "step": 1618 }, { "epoch": 0.05, "learning_rate": 4.995382920419922e-06, "loss": 1.3351, "step": 1619 }, { "epoch": 0.05, "learning_rate": 4.995368091021198e-06, "loss": 1.1236, "step": 1620 }, { "epoch": 0.05, "learning_rate": 4.99535323786777e-06, "loss": 1.0858, "step": 1621 }, { "epoch": 0.05, "learning_rate": 4.995338360959782e-06, "loss": 1.1331, "step": 1622 }, { "epoch": 0.05, "learning_rate": 4.995323460297373e-06, "loss": 1.2081, "step": 1623 }, { "epoch": 0.05, "learning_rate": 4.995308535880688e-06, "loss": 1.2941, "step": 1624 }, { "epoch": 0.05, "learning_rate": 4.995293587709868e-06, "loss": 1.1794, "step": 1625 }, { "epoch": 0.05, "learning_rate": 4.995278615785053e-06, "loss": 1.1582, "step": 1626 }, { "epoch": 0.05, "learning_rate": 4.995263620106389e-06, "loss": 1.1793, "step": 1627 }, { "epoch": 0.05, "learning_rate": 4.995248600674016e-06, "loss": 1.1071, "step": 1628 }, { "epoch": 0.05, "learning_rate": 4.995233557488079e-06, "loss": 1.2351, "step": 1629 }, { "epoch": 0.05, "learning_rate": 4.995218490548719e-06, "loss": 1.1041, "step": 1630 }, { "epoch": 0.05, "learning_rate": 4.995203399856081e-06, "loss": 1.2623, "step": 1631 }, { "epoch": 0.05, "learning_rate": 4.995188285410309e-06, "loss": 1.1351, "step": 1632 }, { "epoch": 0.05, "learning_rate": 4.995173147211546e-06, "loss": 1.1996, "step": 1633 }, { "epoch": 0.05, "learning_rate": 4.995157985259936e-06, "loss": 1.137, "step": 1634 }, { "epoch": 0.05, "learning_rate": 4.9951427995556246e-06, "loss": 1.1227, "step": 1635 }, { "epoch": 0.05, "learning_rate": 4.995127590098755e-06, "loss": 1.1649, "step": 1636 }, { "epoch": 0.05, "learning_rate": 4.995112356889472e-06, "loss": 1.1418, "step": 1637 }, { "epoch": 0.05, "learning_rate": 4.995097099927922e-06, "loss": 1.227, "step": 1638 }, { "epoch": 0.05, "learning_rate": 4.995081819214248e-06, "loss": 1.1496, "step": 1639 }, { "epoch": 0.05, "learning_rate": 4.995066514748598e-06, "loss": 1.0347, "step": 1640 }, { "epoch": 0.05, "learning_rate": 4.9950511865311155e-06, "loss": 1.2484, "step": 1641 }, { "epoch": 0.05, "learning_rate": 4.995035834561948e-06, "loss": 1.1472, "step": 1642 }, { "epoch": 0.05, "learning_rate": 4.995020458841241e-06, "loss": 1.2468, "step": 1643 }, { "epoch": 0.05, "learning_rate": 4.99500505936914e-06, "loss": 1.1393, "step": 1644 }, { "epoch": 0.05, "learning_rate": 4.9949896361457936e-06, "loss": 1.0506, "step": 1645 }, { "epoch": 0.05, "learning_rate": 4.994974189171346e-06, "loss": 1.1703, "step": 1646 }, { "epoch": 0.05, "learning_rate": 4.9949587184459484e-06, "loss": 1.2708, "step": 1647 }, { "epoch": 0.05, "learning_rate": 4.9949432239697435e-06, "loss": 1.1866, "step": 1648 }, { "epoch": 0.05, "learning_rate": 4.99492770574288e-06, "loss": 1.3478, "step": 1649 }, { "epoch": 0.05, "learning_rate": 4.994912163765508e-06, "loss": 1.2264, "step": 1650 }, { "epoch": 0.05, "learning_rate": 4.9948965980377726e-06, "loss": 1.2232, "step": 1651 }, { "epoch": 0.05, "learning_rate": 4.994881008559824e-06, "loss": 1.067, "step": 1652 }, { "epoch": 0.05, "learning_rate": 4.994865395331809e-06, "loss": 1.0826, "step": 1653 }, { "epoch": 0.05, "learning_rate": 4.994849758353878e-06, "loss": 1.1506, "step": 1654 }, { "epoch": 0.05, "learning_rate": 4.994834097626178e-06, "loss": 1.2198, "step": 1655 }, { "epoch": 0.05, "learning_rate": 4.99481841314886e-06, "loss": 1.2283, "step": 1656 }, { "epoch": 0.05, "learning_rate": 4.994802704922071e-06, "loss": 1.1685, "step": 1657 }, { "epoch": 0.05, "learning_rate": 4.994786972945963e-06, "loss": 1.2269, "step": 1658 }, { "epoch": 0.05, "learning_rate": 4.994771217220683e-06, "loss": 1.0861, "step": 1659 }, { "epoch": 0.05, "learning_rate": 4.9947554377463835e-06, "loss": 1.1929, "step": 1660 }, { "epoch": 0.05, "learning_rate": 4.994739634523213e-06, "loss": 1.1861, "step": 1661 }, { "epoch": 0.05, "learning_rate": 4.994723807551324e-06, "loss": 1.1339, "step": 1662 }, { "epoch": 0.05, "learning_rate": 4.994707956830865e-06, "loss": 1.1885, "step": 1663 }, { "epoch": 0.05, "learning_rate": 4.9946920823619885e-06, "loss": 1.1979, "step": 1664 }, { "epoch": 0.05, "learning_rate": 4.994676184144844e-06, "loss": 1.1755, "step": 1665 }, { "epoch": 0.05, "learning_rate": 4.9946602621795835e-06, "loss": 1.1328, "step": 1666 }, { "epoch": 0.05, "learning_rate": 4.994644316466359e-06, "loss": 1.1513, "step": 1667 }, { "epoch": 0.05, "learning_rate": 4.994628347005323e-06, "loss": 1.1221, "step": 1668 }, { "epoch": 0.05, "learning_rate": 4.994612353796626e-06, "loss": 1.2172, "step": 1669 }, { "epoch": 0.05, "learning_rate": 4.994596336840421e-06, "loss": 1.1649, "step": 1670 }, { "epoch": 0.05, "learning_rate": 4.9945802961368594e-06, "loss": 1.2111, "step": 1671 }, { "epoch": 0.05, "learning_rate": 4.994564231686096e-06, "loss": 1.2229, "step": 1672 }, { "epoch": 0.05, "learning_rate": 4.9945481434882815e-06, "loss": 1.1837, "step": 1673 }, { "epoch": 0.05, "learning_rate": 4.994532031543571e-06, "loss": 1.2053, "step": 1674 }, { "epoch": 0.05, "learning_rate": 4.994515895852117e-06, "loss": 1.1487, "step": 1675 }, { "epoch": 0.05, "learning_rate": 4.994499736414072e-06, "loss": 1.1232, "step": 1676 }, { "epoch": 0.05, "learning_rate": 4.994483553229592e-06, "loss": 1.191, "step": 1677 }, { "epoch": 0.05, "learning_rate": 4.994467346298829e-06, "loss": 1.072, "step": 1678 }, { "epoch": 0.05, "learning_rate": 4.994451115621939e-06, "loss": 1.1729, "step": 1679 }, { "epoch": 0.05, "learning_rate": 4.994434861199076e-06, "loss": 1.2803, "step": 1680 }, { "epoch": 0.05, "learning_rate": 4.994418583030393e-06, "loss": 1.2723, "step": 1681 }, { "epoch": 0.05, "learning_rate": 4.994402281116048e-06, "loss": 1.1328, "step": 1682 }, { "epoch": 0.05, "learning_rate": 4.994385955456193e-06, "loss": 1.1125, "step": 1683 }, { "epoch": 0.05, "learning_rate": 4.994369606050987e-06, "loss": 1.0543, "step": 1684 }, { "epoch": 0.05, "learning_rate": 4.994353232900583e-06, "loss": 1.2303, "step": 1685 }, { "epoch": 0.05, "learning_rate": 4.994336836005137e-06, "loss": 1.2257, "step": 1686 }, { "epoch": 0.05, "learning_rate": 4.994320415364806e-06, "loss": 1.3856, "step": 1687 }, { "epoch": 0.05, "learning_rate": 4.994303970979746e-06, "loss": 1.15, "step": 1688 }, { "epoch": 0.05, "learning_rate": 4.994287502850113e-06, "loss": 1.0637, "step": 1689 }, { "epoch": 0.05, "learning_rate": 4.994271010976065e-06, "loss": 1.0891, "step": 1690 }, { "epoch": 0.05, "learning_rate": 4.9942544953577575e-06, "loss": 1.1115, "step": 1691 }, { "epoch": 0.05, "learning_rate": 4.994237955995349e-06, "loss": 1.3015, "step": 1692 }, { "epoch": 0.05, "learning_rate": 4.994221392888997e-06, "loss": 1.225, "step": 1693 }, { "epoch": 0.05, "learning_rate": 4.994204806038857e-06, "loss": 1.3075, "step": 1694 }, { "epoch": 0.05, "learning_rate": 4.99418819544509e-06, "loss": 1.1508, "step": 1695 }, { "epoch": 0.05, "learning_rate": 4.994171561107852e-06, "loss": 1.152, "step": 1696 }, { "epoch": 0.05, "learning_rate": 4.9941549030273015e-06, "loss": 1.137, "step": 1697 }, { "epoch": 0.05, "learning_rate": 4.9941382212035986e-06, "loss": 1.2516, "step": 1698 }, { "epoch": 0.05, "learning_rate": 4.9941215156369006e-06, "loss": 1.2577, "step": 1699 }, { "epoch": 0.05, "learning_rate": 4.994104786327367e-06, "loss": 1.2245, "step": 1700 }, { "epoch": 0.05, "learning_rate": 4.994088033275156e-06, "loss": 1.1021, "step": 1701 }, { "epoch": 0.05, "learning_rate": 4.9940712564804296e-06, "loss": 1.1862, "step": 1702 }, { "epoch": 0.05, "learning_rate": 4.9940544559433455e-06, "loss": 1.1258, "step": 1703 }, { "epoch": 0.05, "learning_rate": 4.9940376316640634e-06, "loss": 1.2409, "step": 1704 }, { "epoch": 0.05, "learning_rate": 4.994020783642746e-06, "loss": 1.3036, "step": 1705 }, { "epoch": 0.05, "learning_rate": 4.99400391187955e-06, "loss": 1.2081, "step": 1706 }, { "epoch": 0.05, "learning_rate": 4.99398701637464e-06, "loss": 1.1615, "step": 1707 }, { "epoch": 0.05, "learning_rate": 4.993970097128172e-06, "loss": 1.2204, "step": 1708 }, { "epoch": 0.05, "learning_rate": 4.993953154140312e-06, "loss": 1.2557, "step": 1709 }, { "epoch": 0.05, "learning_rate": 4.993936187411218e-06, "loss": 1.1786, "step": 1710 }, { "epoch": 0.05, "learning_rate": 4.993919196941054e-06, "loss": 1.2738, "step": 1711 }, { "epoch": 0.05, "learning_rate": 4.993902182729979e-06, "loss": 1.1138, "step": 1712 }, { "epoch": 0.05, "learning_rate": 4.9938851447781565e-06, "loss": 1.2151, "step": 1713 }, { "epoch": 0.05, "learning_rate": 4.993868083085749e-06, "loss": 1.1438, "step": 1714 }, { "epoch": 0.05, "learning_rate": 4.993850997652918e-06, "loss": 1.0769, "step": 1715 }, { "epoch": 0.05, "learning_rate": 4.993833888479827e-06, "loss": 1.0342, "step": 1716 }, { "epoch": 0.05, "learning_rate": 4.993816755566638e-06, "loss": 1.1973, "step": 1717 }, { "epoch": 0.05, "learning_rate": 4.993799598913515e-06, "loss": 1.2147, "step": 1718 }, { "epoch": 0.05, "learning_rate": 4.993782418520621e-06, "loss": 1.0717, "step": 1719 }, { "epoch": 0.05, "learning_rate": 4.993765214388119e-06, "loss": 1.1673, "step": 1720 }, { "epoch": 0.05, "learning_rate": 4.993747986516173e-06, "loss": 1.2903, "step": 1721 }, { "epoch": 0.05, "learning_rate": 4.993730734904947e-06, "loss": 1.0559, "step": 1722 }, { "epoch": 0.05, "learning_rate": 4.993713459554606e-06, "loss": 1.1838, "step": 1723 }, { "epoch": 0.05, "learning_rate": 4.993696160465313e-06, "loss": 1.1482, "step": 1724 }, { "epoch": 0.05, "learning_rate": 4.993678837637235e-06, "loss": 1.1609, "step": 1725 }, { "epoch": 0.05, "learning_rate": 4.993661491070535e-06, "loss": 1.1902, "step": 1726 }, { "epoch": 0.05, "learning_rate": 4.993644120765379e-06, "loss": 1.2123, "step": 1727 }, { "epoch": 0.05, "learning_rate": 4.993626726721931e-06, "loss": 1.1949, "step": 1728 }, { "epoch": 0.05, "learning_rate": 4.993609308940357e-06, "loss": 1.223, "step": 1729 }, { "epoch": 0.05, "learning_rate": 4.993591867420825e-06, "loss": 1.1504, "step": 1730 }, { "epoch": 0.05, "learning_rate": 4.993574402163498e-06, "loss": 1.2003, "step": 1731 }, { "epoch": 0.05, "learning_rate": 4.993556913168545e-06, "loss": 1.1251, "step": 1732 }, { "epoch": 0.05, "learning_rate": 4.993539400436129e-06, "loss": 1.2101, "step": 1733 }, { "epoch": 0.05, "learning_rate": 4.9935218639664205e-06, "loss": 1.1796, "step": 1734 }, { "epoch": 0.05, "learning_rate": 4.993504303759585e-06, "loss": 1.1869, "step": 1735 }, { "epoch": 0.05, "learning_rate": 4.993486719815789e-06, "loss": 1.136, "step": 1736 }, { "epoch": 0.05, "learning_rate": 4.9934691121351995e-06, "loss": 1.2129, "step": 1737 }, { "epoch": 0.05, "learning_rate": 4.993451480717986e-06, "loss": 1.0723, "step": 1738 }, { "epoch": 0.05, "learning_rate": 4.993433825564315e-06, "loss": 1.2408, "step": 1739 }, { "epoch": 0.05, "learning_rate": 4.9934161466743545e-06, "loss": 1.1537, "step": 1740 }, { "epoch": 0.05, "learning_rate": 4.993398444048274e-06, "loss": 1.0949, "step": 1741 }, { "epoch": 0.05, "learning_rate": 4.99338071768624e-06, "loss": 1.2535, "step": 1742 }, { "epoch": 0.05, "learning_rate": 4.993362967588423e-06, "loss": 1.1711, "step": 1743 }, { "epoch": 0.05, "learning_rate": 4.993345193754992e-06, "loss": 1.1674, "step": 1744 }, { "epoch": 0.05, "learning_rate": 4.993327396186115e-06, "loss": 1.1352, "step": 1745 }, { "epoch": 0.05, "learning_rate": 4.993309574881962e-06, "loss": 1.1139, "step": 1746 }, { "epoch": 0.05, "learning_rate": 4.993291729842703e-06, "loss": 1.1443, "step": 1747 }, { "epoch": 0.05, "learning_rate": 4.993273861068507e-06, "loss": 1.1875, "step": 1748 }, { "epoch": 0.05, "learning_rate": 4.993255968559545e-06, "loss": 1.3621, "step": 1749 }, { "epoch": 0.05, "learning_rate": 4.993238052315987e-06, "loss": 1.3691, "step": 1750 }, { "epoch": 0.05, "learning_rate": 4.9932201123380034e-06, "loss": 1.1616, "step": 1751 }, { "epoch": 0.05, "learning_rate": 4.9932021486257656e-06, "loss": 1.1288, "step": 1752 }, { "epoch": 0.05, "learning_rate": 4.993184161179443e-06, "loss": 1.1696, "step": 1753 }, { "epoch": 0.05, "learning_rate": 4.993166149999209e-06, "loss": 1.0894, "step": 1754 }, { "epoch": 0.05, "learning_rate": 4.993148115085233e-06, "loss": 1.2091, "step": 1755 }, { "epoch": 0.05, "learning_rate": 4.9931300564376885e-06, "loss": 1.0378, "step": 1756 }, { "epoch": 0.05, "learning_rate": 4.993111974056746e-06, "loss": 1.2112, "step": 1757 }, { "epoch": 0.05, "learning_rate": 4.993093867942579e-06, "loss": 1.2089, "step": 1758 }, { "epoch": 0.05, "learning_rate": 4.9930757380953585e-06, "loss": 1.1425, "step": 1759 }, { "epoch": 0.05, "learning_rate": 4.993057584515259e-06, "loss": 1.2323, "step": 1760 }, { "epoch": 0.05, "learning_rate": 4.99303940720245e-06, "loss": 1.2281, "step": 1761 }, { "epoch": 0.05, "learning_rate": 4.993021206157107e-06, "loss": 1.3446, "step": 1762 }, { "epoch": 0.05, "learning_rate": 4.993002981379404e-06, "loss": 1.0708, "step": 1763 }, { "epoch": 0.05, "learning_rate": 4.992984732869512e-06, "loss": 1.13, "step": 1764 }, { "epoch": 0.05, "learning_rate": 4.992966460627606e-06, "loss": 1.0885, "step": 1765 }, { "epoch": 0.05, "learning_rate": 4.992948164653861e-06, "loss": 1.155, "step": 1766 }, { "epoch": 0.05, "learning_rate": 4.992929844948449e-06, "loss": 1.1599, "step": 1767 }, { "epoch": 0.05, "learning_rate": 4.992911501511546e-06, "loss": 1.0884, "step": 1768 }, { "epoch": 0.05, "learning_rate": 4.992893134343327e-06, "loss": 1.2465, "step": 1769 }, { "epoch": 0.05, "learning_rate": 4.992874743443965e-06, "loss": 1.1279, "step": 1770 }, { "epoch": 0.05, "learning_rate": 4.992856328813636e-06, "loss": 1.0395, "step": 1771 }, { "epoch": 0.05, "learning_rate": 4.992837890452515e-06, "loss": 1.1788, "step": 1772 }, { "epoch": 0.05, "learning_rate": 4.992819428360779e-06, "loss": 1.0602, "step": 1773 }, { "epoch": 0.05, "learning_rate": 4.992800942538603e-06, "loss": 1.2147, "step": 1774 }, { "epoch": 0.05, "learning_rate": 4.99278243298616e-06, "loss": 1.1048, "step": 1775 }, { "epoch": 0.05, "learning_rate": 4.9927638997036314e-06, "loss": 1.2137, "step": 1776 }, { "epoch": 0.05, "learning_rate": 4.99274534269119e-06, "loss": 1.1358, "step": 1777 }, { "epoch": 0.05, "learning_rate": 4.992726761949014e-06, "loss": 1.1248, "step": 1778 }, { "epoch": 0.05, "learning_rate": 4.99270815747728e-06, "loss": 1.3333, "step": 1779 }, { "epoch": 0.05, "learning_rate": 4.992689529276163e-06, "loss": 1.2406, "step": 1780 }, { "epoch": 0.05, "learning_rate": 4.992670877345844e-06, "loss": 1.2061, "step": 1781 }, { "epoch": 0.05, "learning_rate": 4.992652201686498e-06, "loss": 1.2119, "step": 1782 }, { "epoch": 0.05, "learning_rate": 4.992633502298304e-06, "loss": 1.1481, "step": 1783 }, { "epoch": 0.05, "learning_rate": 4.992614779181439e-06, "loss": 1.1063, "step": 1784 }, { "epoch": 0.05, "learning_rate": 4.992596032336083e-06, "loss": 1.0818, "step": 1785 }, { "epoch": 0.05, "learning_rate": 4.992577261762412e-06, "loss": 1.1601, "step": 1786 }, { "epoch": 0.05, "learning_rate": 4.992558467460605e-06, "loss": 1.1558, "step": 1787 }, { "epoch": 0.05, "learning_rate": 4.992539649430844e-06, "loss": 1.2151, "step": 1788 }, { "epoch": 0.05, "learning_rate": 4.992520807673305e-06, "loss": 1.1699, "step": 1789 }, { "epoch": 0.05, "learning_rate": 4.992501942188168e-06, "loss": 1.1133, "step": 1790 }, { "epoch": 0.05, "learning_rate": 4.992483052975614e-06, "loss": 1.1204, "step": 1791 }, { "epoch": 0.05, "learning_rate": 4.992464140035821e-06, "loss": 1.2202, "step": 1792 }, { "epoch": 0.05, "learning_rate": 4.99244520336897e-06, "loss": 1.1898, "step": 1793 }, { "epoch": 0.05, "learning_rate": 4.9924262429752415e-06, "loss": 1.226, "step": 1794 }, { "epoch": 0.05, "learning_rate": 4.992407258854814e-06, "loss": 1.1675, "step": 1795 }, { "epoch": 0.05, "learning_rate": 4.992388251007871e-06, "loss": 1.1712, "step": 1796 }, { "epoch": 0.05, "learning_rate": 4.992369219434592e-06, "loss": 1.1633, "step": 1797 }, { "epoch": 0.05, "learning_rate": 4.992350164135159e-06, "loss": 1.182, "step": 1798 }, { "epoch": 0.05, "learning_rate": 4.992331085109751e-06, "loss": 1.1582, "step": 1799 }, { "epoch": 0.05, "learning_rate": 4.992311982358554e-06, "loss": 1.1177, "step": 1800 }, { "epoch": 0.05, "learning_rate": 4.992292855881746e-06, "loss": 1.0875, "step": 1801 }, { "epoch": 0.05, "learning_rate": 4.9922737056795104e-06, "loss": 1.1392, "step": 1802 }, { "epoch": 0.05, "learning_rate": 4.992254531752029e-06, "loss": 1.2073, "step": 1803 }, { "epoch": 0.05, "learning_rate": 4.992235334099485e-06, "loss": 1.1397, "step": 1804 }, { "epoch": 0.05, "learning_rate": 4.992216112722061e-06, "loss": 1.2868, "step": 1805 }, { "epoch": 0.05, "learning_rate": 4.99219686761994e-06, "loss": 1.0015, "step": 1806 }, { "epoch": 0.05, "learning_rate": 4.992177598793305e-06, "loss": 1.1962, "step": 1807 }, { "epoch": 0.05, "learning_rate": 4.99215830624234e-06, "loss": 1.1972, "step": 1808 }, { "epoch": 0.05, "learning_rate": 4.992138989967228e-06, "loss": 1.157, "step": 1809 }, { "epoch": 0.05, "learning_rate": 4.992119649968152e-06, "loss": 1.0169, "step": 1810 }, { "epoch": 0.05, "learning_rate": 4.992100286245299e-06, "loss": 1.1111, "step": 1811 }, { "epoch": 0.05, "learning_rate": 4.99208089879885e-06, "loss": 1.2236, "step": 1812 }, { "epoch": 0.05, "learning_rate": 4.992061487628991e-06, "loss": 1.0386, "step": 1813 }, { "epoch": 0.05, "learning_rate": 4.992042052735908e-06, "loss": 1.1586, "step": 1814 }, { "epoch": 0.05, "learning_rate": 4.992022594119784e-06, "loss": 1.2238, "step": 1815 }, { "epoch": 0.05, "learning_rate": 4.992003111780806e-06, "loss": 1.0806, "step": 1816 }, { "epoch": 0.05, "learning_rate": 4.991983605719158e-06, "loss": 1.1262, "step": 1817 }, { "epoch": 0.05, "learning_rate": 4.991964075935025e-06, "loss": 1.2547, "step": 1818 }, { "epoch": 0.05, "learning_rate": 4.991944522428595e-06, "loss": 1.24, "step": 1819 }, { "epoch": 0.05, "learning_rate": 4.9919249452000545e-06, "loss": 1.2107, "step": 1820 }, { "epoch": 0.05, "learning_rate": 4.991905344249588e-06, "loss": 1.208, "step": 1821 }, { "epoch": 0.05, "learning_rate": 4.9918857195773825e-06, "loss": 1.1254, "step": 1822 }, { "epoch": 0.05, "learning_rate": 4.991866071183626e-06, "loss": 1.1178, "step": 1823 }, { "epoch": 0.05, "learning_rate": 4.991846399068503e-06, "loss": 1.2797, "step": 1824 }, { "epoch": 0.05, "learning_rate": 4.991826703232203e-06, "loss": 1.1245, "step": 1825 }, { "epoch": 0.06, "learning_rate": 4.991806983674914e-06, "loss": 1.1855, "step": 1826 }, { "epoch": 0.06, "learning_rate": 4.991787240396822e-06, "loss": 1.0915, "step": 1827 }, { "epoch": 0.06, "learning_rate": 4.991767473398115e-06, "loss": 1.0463, "step": 1828 }, { "epoch": 0.06, "learning_rate": 4.9917476826789816e-06, "loss": 1.0316, "step": 1829 }, { "epoch": 0.06, "learning_rate": 4.991727868239611e-06, "loss": 1.184, "step": 1830 }, { "epoch": 0.06, "learning_rate": 4.991708030080191e-06, "loss": 1.1977, "step": 1831 }, { "epoch": 0.06, "learning_rate": 4.99168816820091e-06, "loss": 1.1993, "step": 1832 }, { "epoch": 0.06, "learning_rate": 4.991668282601958e-06, "loss": 1.0783, "step": 1833 }, { "epoch": 0.06, "learning_rate": 4.991648373283525e-06, "loss": 1.192, "step": 1834 }, { "epoch": 0.06, "learning_rate": 4.991628440245798e-06, "loss": 1.2295, "step": 1835 }, { "epoch": 0.06, "learning_rate": 4.991608483488969e-06, "loss": 1.1897, "step": 1836 }, { "epoch": 0.06, "learning_rate": 4.991588503013227e-06, "loss": 1.1386, "step": 1837 }, { "epoch": 0.06, "learning_rate": 4.991568498818763e-06, "loss": 1.142, "step": 1838 }, { "epoch": 0.06, "learning_rate": 4.9915484709057665e-06, "loss": 1.1813, "step": 1839 }, { "epoch": 0.06, "learning_rate": 4.991528419274429e-06, "loss": 1.1105, "step": 1840 }, { "epoch": 0.06, "learning_rate": 4.99150834392494e-06, "loss": 1.2478, "step": 1841 }, { "epoch": 0.06, "learning_rate": 4.991488244857492e-06, "loss": 1.2432, "step": 1842 }, { "epoch": 0.06, "learning_rate": 4.991468122072276e-06, "loss": 1.282, "step": 1843 }, { "epoch": 0.06, "learning_rate": 4.9914479755694825e-06, "loss": 1.217, "step": 1844 }, { "epoch": 0.06, "learning_rate": 4.9914278053493055e-06, "loss": 1.0934, "step": 1845 }, { "epoch": 0.06, "learning_rate": 4.991407611411935e-06, "loss": 1.1908, "step": 1846 }, { "epoch": 0.06, "learning_rate": 4.991387393757564e-06, "loss": 1.1635, "step": 1847 }, { "epoch": 0.06, "learning_rate": 4.991367152386385e-06, "loss": 1.1462, "step": 1848 }, { "epoch": 0.06, "learning_rate": 4.9913468872985905e-06, "loss": 1.1096, "step": 1849 }, { "epoch": 0.06, "learning_rate": 4.991326598494373e-06, "loss": 1.2751, "step": 1850 }, { "epoch": 0.06, "learning_rate": 4.991306285973927e-06, "loss": 1.1738, "step": 1851 }, { "epoch": 0.06, "learning_rate": 4.991285949737445e-06, "loss": 1.0478, "step": 1852 }, { "epoch": 0.06, "learning_rate": 4.99126558978512e-06, "loss": 1.1918, "step": 1853 }, { "epoch": 0.06, "learning_rate": 4.991245206117147e-06, "loss": 1.2594, "step": 1854 }, { "epoch": 0.06, "learning_rate": 4.9912247987337195e-06, "loss": 1.0857, "step": 1855 }, { "epoch": 0.06, "learning_rate": 4.991204367635031e-06, "loss": 1.3604, "step": 1856 }, { "epoch": 0.06, "learning_rate": 4.991183912821277e-06, "loss": 1.2059, "step": 1857 }, { "epoch": 0.06, "learning_rate": 4.991163434292652e-06, "loss": 1.1129, "step": 1858 }, { "epoch": 0.06, "learning_rate": 4.991142932049351e-06, "loss": 1.1208, "step": 1859 }, { "epoch": 0.06, "learning_rate": 4.991122406091569e-06, "loss": 1.1471, "step": 1860 }, { "epoch": 0.06, "learning_rate": 4.991101856419502e-06, "loss": 1.1185, "step": 1861 }, { "epoch": 0.06, "learning_rate": 4.991081283033345e-06, "loss": 1.1464, "step": 1862 }, { "epoch": 0.06, "learning_rate": 4.991060685933293e-06, "loss": 1.0615, "step": 1863 }, { "epoch": 0.06, "learning_rate": 4.9910400651195436e-06, "loss": 1.207, "step": 1864 }, { "epoch": 0.06, "learning_rate": 4.991019420592293e-06, "loss": 1.1184, "step": 1865 }, { "epoch": 0.06, "learning_rate": 4.990998752351735e-06, "loss": 1.1034, "step": 1866 }, { "epoch": 0.06, "learning_rate": 4.990978060398071e-06, "loss": 1.1022, "step": 1867 }, { "epoch": 0.06, "learning_rate": 4.9909573447314955e-06, "loss": 1.2406, "step": 1868 }, { "epoch": 0.06, "learning_rate": 4.990936605352204e-06, "loss": 1.2224, "step": 1869 }, { "epoch": 0.06, "learning_rate": 4.990915842260398e-06, "loss": 1.1685, "step": 1870 }, { "epoch": 0.06, "learning_rate": 4.990895055456271e-06, "loss": 1.0631, "step": 1871 }, { "epoch": 0.06, "learning_rate": 4.990874244940023e-06, "loss": 1.1515, "step": 1872 }, { "epoch": 0.06, "learning_rate": 4.9908534107118525e-06, "loss": 1.2278, "step": 1873 }, { "epoch": 0.06, "learning_rate": 4.990832552771957e-06, "loss": 1.2804, "step": 1874 }, { "epoch": 0.06, "learning_rate": 4.990811671120535e-06, "loss": 1.2511, "step": 1875 }, { "epoch": 0.06, "learning_rate": 4.990790765757785e-06, "loss": 1.1488, "step": 1876 }, { "epoch": 0.06, "learning_rate": 4.990769836683907e-06, "loss": 1.0787, "step": 1877 }, { "epoch": 0.06, "learning_rate": 4.9907488838991e-06, "loss": 1.0507, "step": 1878 }, { "epoch": 0.06, "learning_rate": 4.990727907403563e-06, "loss": 1.2288, "step": 1879 }, { "epoch": 0.06, "learning_rate": 4.990706907197497e-06, "loss": 1.215, "step": 1880 }, { "epoch": 0.06, "learning_rate": 4.990685883281099e-06, "loss": 1.152, "step": 1881 }, { "epoch": 0.06, "learning_rate": 4.990664835654572e-06, "loss": 1.2483, "step": 1882 }, { "epoch": 0.06, "learning_rate": 4.990643764318115e-06, "loss": 1.264, "step": 1883 }, { "epoch": 0.06, "learning_rate": 4.990622669271928e-06, "loss": 1.1669, "step": 1884 }, { "epoch": 0.06, "learning_rate": 4.990601550516214e-06, "loss": 1.2172, "step": 1885 }, { "epoch": 0.06, "learning_rate": 4.990580408051173e-06, "loss": 1.194, "step": 1886 }, { "epoch": 0.06, "learning_rate": 4.990559241877005e-06, "loss": 1.2091, "step": 1887 }, { "epoch": 0.06, "learning_rate": 4.990538051993913e-06, "loss": 1.1351, "step": 1888 }, { "epoch": 0.06, "learning_rate": 4.990516838402099e-06, "loss": 1.1061, "step": 1889 }, { "epoch": 0.06, "learning_rate": 4.990495601101762e-06, "loss": 1.1444, "step": 1890 }, { "epoch": 0.06, "learning_rate": 4.990474340093108e-06, "loss": 1.147, "step": 1891 }, { "epoch": 0.06, "learning_rate": 4.990453055376337e-06, "loss": 1.1416, "step": 1892 }, { "epoch": 0.06, "learning_rate": 4.990431746951654e-06, "loss": 1.3163, "step": 1893 }, { "epoch": 0.06, "learning_rate": 4.990410414819258e-06, "loss": 1.1438, "step": 1894 }, { "epoch": 0.06, "learning_rate": 4.990389058979356e-06, "loss": 1.2422, "step": 1895 }, { "epoch": 0.06, "learning_rate": 4.9903676794321484e-06, "loss": 1.2457, "step": 1896 }, { "epoch": 0.06, "learning_rate": 4.99034627617784e-06, "loss": 1.1146, "step": 1897 }, { "epoch": 0.06, "learning_rate": 4.990324849216635e-06, "loss": 1.1113, "step": 1898 }, { "epoch": 0.06, "learning_rate": 4.990303398548736e-06, "loss": 1.1888, "step": 1899 }, { "epoch": 0.06, "learning_rate": 4.990281924174349e-06, "loss": 1.1556, "step": 1900 }, { "epoch": 0.06, "learning_rate": 4.990260426093677e-06, "loss": 1.1411, "step": 1901 }, { "epoch": 0.06, "learning_rate": 4.9902389043069255e-06, "loss": 1.1866, "step": 1902 }, { "epoch": 0.06, "learning_rate": 4.990217358814298e-06, "loss": 1.1622, "step": 1903 }, { "epoch": 0.06, "learning_rate": 4.990195789616001e-06, "loss": 1.1802, "step": 1904 }, { "epoch": 0.06, "learning_rate": 4.99017419671224e-06, "loss": 1.1766, "step": 1905 }, { "epoch": 0.06, "learning_rate": 4.990152580103219e-06, "loss": 1.1871, "step": 1906 }, { "epoch": 0.06, "learning_rate": 4.9901309397891454e-06, "loss": 1.0873, "step": 1907 }, { "epoch": 0.06, "learning_rate": 4.990109275770225e-06, "loss": 1.1981, "step": 1908 }, { "epoch": 0.06, "learning_rate": 4.990087588046662e-06, "loss": 1.1417, "step": 1909 }, { "epoch": 0.06, "learning_rate": 4.990065876618666e-06, "loss": 1.1264, "step": 1910 }, { "epoch": 0.06, "learning_rate": 4.990044141486441e-06, "loss": 1.3105, "step": 1911 }, { "epoch": 0.06, "learning_rate": 4.990022382650196e-06, "loss": 1.0682, "step": 1912 }, { "epoch": 0.06, "learning_rate": 4.9900006001101364e-06, "loss": 1.1171, "step": 1913 }, { "epoch": 0.06, "learning_rate": 4.989978793866472e-06, "loss": 1.0682, "step": 1914 }, { "epoch": 0.06, "learning_rate": 4.989956963919406e-06, "loss": 1.0899, "step": 1915 }, { "epoch": 0.06, "learning_rate": 4.989935110269151e-06, "loss": 1.2227, "step": 1916 }, { "epoch": 0.06, "learning_rate": 4.989913232915912e-06, "loss": 1.2773, "step": 1917 }, { "epoch": 0.06, "learning_rate": 4.989891331859897e-06, "loss": 1.1799, "step": 1918 }, { "epoch": 0.06, "learning_rate": 4.989869407101318e-06, "loss": 1.1683, "step": 1919 }, { "epoch": 0.06, "learning_rate": 4.98984745864038e-06, "loss": 1.238, "step": 1920 }, { "epoch": 0.06, "learning_rate": 4.989825486477294e-06, "loss": 1.2238, "step": 1921 }, { "epoch": 0.06, "learning_rate": 4.989803490612268e-06, "loss": 1.2483, "step": 1922 }, { "epoch": 0.06, "learning_rate": 4.989781471045513e-06, "loss": 1.1865, "step": 1923 }, { "epoch": 0.06, "learning_rate": 4.989759427777237e-06, "loss": 1.1711, "step": 1924 }, { "epoch": 0.06, "learning_rate": 4.989737360807649e-06, "loss": 1.175, "step": 1925 }, { "epoch": 0.06, "learning_rate": 4.989715270136961e-06, "loss": 1.175, "step": 1926 }, { "epoch": 0.06, "learning_rate": 4.989693155765384e-06, "loss": 1.0892, "step": 1927 }, { "epoch": 0.06, "learning_rate": 4.989671017693126e-06, "loss": 1.0696, "step": 1928 }, { "epoch": 0.06, "learning_rate": 4.9896488559204e-06, "loss": 1.2998, "step": 1929 }, { "epoch": 0.06, "learning_rate": 4.989626670447415e-06, "loss": 1.2631, "step": 1930 }, { "epoch": 0.06, "learning_rate": 4.989604461274384e-06, "loss": 1.3171, "step": 1931 }, { "epoch": 0.06, "learning_rate": 4.989582228401517e-06, "loss": 1.16, "step": 1932 }, { "epoch": 0.06, "learning_rate": 4.989559971829026e-06, "loss": 1.1606, "step": 1933 }, { "epoch": 0.06, "learning_rate": 4.989537691557124e-06, "loss": 1.0742, "step": 1934 }, { "epoch": 0.06, "learning_rate": 4.989515387586022e-06, "loss": 1.1476, "step": 1935 }, { "epoch": 0.06, "learning_rate": 4.989493059915931e-06, "loss": 1.2321, "step": 1936 }, { "epoch": 0.06, "learning_rate": 4.989470708547066e-06, "loss": 1.2372, "step": 1937 }, { "epoch": 0.06, "learning_rate": 4.989448333479639e-06, "loss": 1.1469, "step": 1938 }, { "epoch": 0.06, "learning_rate": 4.989425934713863e-06, "loss": 1.0983, "step": 1939 }, { "epoch": 0.06, "learning_rate": 4.989403512249951e-06, "loss": 1.1199, "step": 1940 }, { "epoch": 0.06, "learning_rate": 4.989381066088116e-06, "loss": 1.1314, "step": 1941 }, { "epoch": 0.06, "learning_rate": 4.989358596228572e-06, "loss": 1.2166, "step": 1942 }, { "epoch": 0.06, "learning_rate": 4.989336102671533e-06, "loss": 1.1805, "step": 1943 }, { "epoch": 0.06, "learning_rate": 4.989313585417215e-06, "loss": 1.2549, "step": 1944 }, { "epoch": 0.06, "learning_rate": 4.989291044465829e-06, "loss": 1.2523, "step": 1945 }, { "epoch": 0.06, "learning_rate": 4.989268479817591e-06, "loss": 1.1691, "step": 1946 }, { "epoch": 0.06, "learning_rate": 4.989245891472717e-06, "loss": 1.1789, "step": 1947 }, { "epoch": 0.06, "learning_rate": 4.98922327943142e-06, "loss": 1.1942, "step": 1948 }, { "epoch": 0.06, "learning_rate": 4.989200643693917e-06, "loss": 1.1624, "step": 1949 }, { "epoch": 0.06, "learning_rate": 4.989177984260422e-06, "loss": 1.1586, "step": 1950 }, { "epoch": 0.06, "learning_rate": 4.989155301131152e-06, "loss": 1.1024, "step": 1951 }, { "epoch": 0.06, "learning_rate": 4.9891325943063215e-06, "loss": 1.2128, "step": 1952 }, { "epoch": 0.06, "learning_rate": 4.989109863786148e-06, "loss": 1.1095, "step": 1953 }, { "epoch": 0.06, "learning_rate": 4.9890871095708485e-06, "loss": 1.0652, "step": 1954 }, { "epoch": 0.06, "learning_rate": 4.989064331660637e-06, "loss": 1.2979, "step": 1955 }, { "epoch": 0.06, "learning_rate": 4.989041530055733e-06, "loss": 1.1725, "step": 1956 }, { "epoch": 0.06, "learning_rate": 4.989018704756351e-06, "loss": 1.0879, "step": 1957 }, { "epoch": 0.06, "learning_rate": 4.988995855762711e-06, "loss": 1.1053, "step": 1958 }, { "epoch": 0.06, "learning_rate": 4.9889729830750284e-06, "loss": 1.1122, "step": 1959 }, { "epoch": 0.06, "learning_rate": 4.988950086693521e-06, "loss": 1.2218, "step": 1960 }, { "epoch": 0.06, "learning_rate": 4.988927166618409e-06, "loss": 1.1768, "step": 1961 }, { "epoch": 0.06, "learning_rate": 4.988904222849909e-06, "loss": 1.3022, "step": 1962 }, { "epoch": 0.06, "learning_rate": 4.9888812553882385e-06, "loss": 1.1634, "step": 1963 }, { "epoch": 0.06, "learning_rate": 4.9888582642336185e-06, "loss": 1.2872, "step": 1964 }, { "epoch": 0.06, "learning_rate": 4.9888352493862655e-06, "loss": 1.0566, "step": 1965 }, { "epoch": 0.06, "learning_rate": 4.988812210846399e-06, "loss": 1.1961, "step": 1966 }, { "epoch": 0.06, "learning_rate": 4.98878914861424e-06, "loss": 1.2167, "step": 1967 }, { "epoch": 0.06, "learning_rate": 4.988766062690006e-06, "loss": 1.2092, "step": 1968 }, { "epoch": 0.06, "learning_rate": 4.9887429530739185e-06, "loss": 1.1915, "step": 1969 }, { "epoch": 0.06, "learning_rate": 4.9887198197661966e-06, "loss": 1.2217, "step": 1970 }, { "epoch": 0.06, "learning_rate": 4.9886966627670605e-06, "loss": 1.1559, "step": 1971 }, { "epoch": 0.06, "learning_rate": 4.988673482076731e-06, "loss": 1.0035, "step": 1972 }, { "epoch": 0.06, "learning_rate": 4.988650277695429e-06, "loss": 1.1774, "step": 1973 }, { "epoch": 0.06, "learning_rate": 4.988627049623373e-06, "loss": 1.1968, "step": 1974 }, { "epoch": 0.06, "learning_rate": 4.988603797860788e-06, "loss": 1.0595, "step": 1975 }, { "epoch": 0.06, "learning_rate": 4.988580522407893e-06, "loss": 1.1901, "step": 1976 }, { "epoch": 0.06, "learning_rate": 4.988557223264909e-06, "loss": 1.1543, "step": 1977 }, { "epoch": 0.06, "learning_rate": 4.98853390043206e-06, "loss": 1.2415, "step": 1978 }, { "epoch": 0.06, "learning_rate": 4.988510553909566e-06, "loss": 1.2595, "step": 1979 }, { "epoch": 0.06, "learning_rate": 4.98848718369765e-06, "loss": 1.178, "step": 1980 }, { "epoch": 0.06, "learning_rate": 4.988463789796535e-06, "loss": 1.2241, "step": 1981 }, { "epoch": 0.06, "learning_rate": 4.988440372206443e-06, "loss": 1.2849, "step": 1982 }, { "epoch": 0.06, "learning_rate": 4.988416930927597e-06, "loss": 1.158, "step": 1983 }, { "epoch": 0.06, "learning_rate": 4.988393465960221e-06, "loss": 1.1897, "step": 1984 }, { "epoch": 0.06, "learning_rate": 4.9883699773045365e-06, "loss": 1.2605, "step": 1985 }, { "epoch": 0.06, "learning_rate": 4.988346464960769e-06, "loss": 1.14, "step": 1986 }, { "epoch": 0.06, "learning_rate": 4.988322928929141e-06, "loss": 1.0616, "step": 1987 }, { "epoch": 0.06, "learning_rate": 4.988299369209878e-06, "loss": 1.113, "step": 1988 }, { "epoch": 0.06, "learning_rate": 4.988275785803203e-06, "loss": 1.1251, "step": 1989 }, { "epoch": 0.06, "learning_rate": 4.988252178709341e-06, "loss": 1.2095, "step": 1990 }, { "epoch": 0.06, "learning_rate": 4.988228547928516e-06, "loss": 1.1732, "step": 1991 }, { "epoch": 0.06, "learning_rate": 4.988204893460954e-06, "loss": 1.2094, "step": 1992 }, { "epoch": 0.06, "learning_rate": 4.98818121530688e-06, "loss": 1.3403, "step": 1993 }, { "epoch": 0.06, "learning_rate": 4.98815751346652e-06, "loss": 1.1157, "step": 1994 }, { "epoch": 0.06, "learning_rate": 4.988133787940097e-06, "loss": 1.0797, "step": 1995 }, { "epoch": 0.06, "learning_rate": 4.98811003872784e-06, "loss": 1.1405, "step": 1996 }, { "epoch": 0.06, "learning_rate": 4.988086265829973e-06, "loss": 1.0806, "step": 1997 }, { "epoch": 0.06, "learning_rate": 4.988062469246724e-06, "loss": 1.1907, "step": 1998 }, { "epoch": 0.06, "learning_rate": 4.988038648978317e-06, "loss": 1.2792, "step": 1999 }, { "epoch": 0.06, "learning_rate": 4.988014805024981e-06, "loss": 1.185, "step": 2000 }, { "epoch": 0.06, "learning_rate": 4.987990937386942e-06, "loss": 1.0763, "step": 2001 }, { "epoch": 0.06, "learning_rate": 4.987967046064429e-06, "loss": 1.0901, "step": 2002 }, { "epoch": 0.06, "learning_rate": 4.987943131057668e-06, "loss": 1.1668, "step": 2003 }, { "epoch": 0.06, "learning_rate": 4.987919192366885e-06, "loss": 1.1404, "step": 2004 }, { "epoch": 0.06, "learning_rate": 4.98789522999231e-06, "loss": 1.1703, "step": 2005 }, { "epoch": 0.06, "learning_rate": 4.9878712439341716e-06, "loss": 1.2279, "step": 2006 }, { "epoch": 0.06, "learning_rate": 4.987847234192696e-06, "loss": 1.2134, "step": 2007 }, { "epoch": 0.06, "learning_rate": 4.987823200768113e-06, "loss": 1.1408, "step": 2008 }, { "epoch": 0.06, "learning_rate": 4.987799143660652e-06, "loss": 1.1118, "step": 2009 }, { "epoch": 0.06, "learning_rate": 4.987775062870541e-06, "loss": 1.1886, "step": 2010 }, { "epoch": 0.06, "learning_rate": 4.987750958398009e-06, "loss": 1.2009, "step": 2011 }, { "epoch": 0.06, "learning_rate": 4.987726830243287e-06, "loss": 1.0886, "step": 2012 }, { "epoch": 0.06, "learning_rate": 4.987702678406603e-06, "loss": 1.1173, "step": 2013 }, { "epoch": 0.06, "learning_rate": 4.987678502888188e-06, "loss": 1.149, "step": 2014 }, { "epoch": 0.06, "learning_rate": 4.9876543036882715e-06, "loss": 1.1453, "step": 2015 }, { "epoch": 0.06, "learning_rate": 4.9876300808070845e-06, "loss": 1.1866, "step": 2016 }, { "epoch": 0.06, "learning_rate": 4.987605834244856e-06, "loss": 1.2305, "step": 2017 }, { "epoch": 0.06, "learning_rate": 4.987581564001819e-06, "loss": 1.2609, "step": 2018 }, { "epoch": 0.06, "learning_rate": 4.987557270078204e-06, "loss": 1.0944, "step": 2019 }, { "epoch": 0.06, "learning_rate": 4.987532952474241e-06, "loss": 1.2349, "step": 2020 }, { "epoch": 0.06, "learning_rate": 4.987508611190162e-06, "loss": 1.1116, "step": 2021 }, { "epoch": 0.06, "learning_rate": 4.987484246226201e-06, "loss": 1.1808, "step": 2022 }, { "epoch": 0.06, "learning_rate": 4.987459857582586e-06, "loss": 1.0766, "step": 2023 }, { "epoch": 0.06, "learning_rate": 4.9874354452595525e-06, "loss": 1.3002, "step": 2024 }, { "epoch": 0.06, "learning_rate": 4.987411009257331e-06, "loss": 1.2611, "step": 2025 }, { "epoch": 0.06, "learning_rate": 4.9873865495761545e-06, "loss": 1.122, "step": 2026 }, { "epoch": 0.06, "learning_rate": 4.987362066216256e-06, "loss": 1.1747, "step": 2027 }, { "epoch": 0.06, "learning_rate": 4.9873375591778685e-06, "loss": 1.1384, "step": 2028 }, { "epoch": 0.06, "learning_rate": 4.987313028461226e-06, "loss": 1.2748, "step": 2029 }, { "epoch": 0.06, "learning_rate": 4.987288474066561e-06, "loss": 1.1407, "step": 2030 }, { "epoch": 0.06, "learning_rate": 4.987263895994108e-06, "loss": 1.0835, "step": 2031 }, { "epoch": 0.06, "learning_rate": 4.9872392942440995e-06, "loss": 1.1104, "step": 2032 }, { "epoch": 0.06, "learning_rate": 4.987214668816772e-06, "loss": 1.1531, "step": 2033 }, { "epoch": 0.06, "learning_rate": 4.987190019712358e-06, "loss": 1.1643, "step": 2034 }, { "epoch": 0.06, "learning_rate": 4.987165346931093e-06, "loss": 1.2318, "step": 2035 }, { "epoch": 0.06, "learning_rate": 4.987140650473213e-06, "loss": 1.1873, "step": 2036 }, { "epoch": 0.06, "learning_rate": 4.9871159303389504e-06, "loss": 1.1844, "step": 2037 }, { "epoch": 0.06, "learning_rate": 4.987091186528542e-06, "loss": 1.2528, "step": 2038 }, { "epoch": 0.06, "learning_rate": 4.987066419042223e-06, "loss": 1.2693, "step": 2039 }, { "epoch": 0.06, "learning_rate": 4.987041627880232e-06, "loss": 1.1809, "step": 2040 }, { "epoch": 0.06, "learning_rate": 4.9870168130427995e-06, "loss": 1.2167, "step": 2041 }, { "epoch": 0.06, "learning_rate": 4.986991974530166e-06, "loss": 1.2649, "step": 2042 }, { "epoch": 0.06, "learning_rate": 4.986967112342566e-06, "loss": 1.2572, "step": 2043 }, { "epoch": 0.06, "learning_rate": 4.986942226480238e-06, "loss": 1.1671, "step": 2044 }, { "epoch": 0.06, "learning_rate": 4.986917316943418e-06, "loss": 1.175, "step": 2045 }, { "epoch": 0.06, "learning_rate": 4.986892383732342e-06, "loss": 1.1857, "step": 2046 }, { "epoch": 0.06, "learning_rate": 4.986867426847248e-06, "loss": 1.1923, "step": 2047 }, { "epoch": 0.06, "learning_rate": 4.986842446288374e-06, "loss": 1.1912, "step": 2048 }, { "epoch": 0.06, "learning_rate": 4.986817442055958e-06, "loss": 1.1512, "step": 2049 }, { "epoch": 0.06, "learning_rate": 4.9867924141502374e-06, "loss": 1.1989, "step": 2050 }, { "epoch": 0.06, "learning_rate": 4.986767362571451e-06, "loss": 1.1809, "step": 2051 }, { "epoch": 0.06, "learning_rate": 4.986742287319837e-06, "loss": 1.1304, "step": 2052 }, { "epoch": 0.06, "learning_rate": 4.986717188395633e-06, "loss": 1.0994, "step": 2053 }, { "epoch": 0.06, "learning_rate": 4.98669206579908e-06, "loss": 1.1455, "step": 2054 }, { "epoch": 0.06, "learning_rate": 4.986666919530416e-06, "loss": 1.2406, "step": 2055 }, { "epoch": 0.06, "learning_rate": 4.986641749589881e-06, "loss": 1.1901, "step": 2056 }, { "epoch": 0.06, "learning_rate": 4.986616555977714e-06, "loss": 1.251, "step": 2057 }, { "epoch": 0.06, "learning_rate": 4.986591338694154e-06, "loss": 1.1047, "step": 2058 }, { "epoch": 0.06, "learning_rate": 4.986566097739443e-06, "loss": 1.1118, "step": 2059 }, { "epoch": 0.06, "learning_rate": 4.98654083311382e-06, "loss": 1.0846, "step": 2060 }, { "epoch": 0.06, "learning_rate": 4.986515544817525e-06, "loss": 1.1268, "step": 2061 }, { "epoch": 0.06, "learning_rate": 4.986490232850801e-06, "loss": 1.1962, "step": 2062 }, { "epoch": 0.06, "learning_rate": 4.9864648972138865e-06, "loss": 1.1804, "step": 2063 }, { "epoch": 0.06, "learning_rate": 4.986439537907024e-06, "loss": 1.1846, "step": 2064 }, { "epoch": 0.06, "learning_rate": 4.986414154930455e-06, "loss": 1.0468, "step": 2065 }, { "epoch": 0.06, "learning_rate": 4.986388748284421e-06, "loss": 1.1806, "step": 2066 }, { "epoch": 0.06, "learning_rate": 4.9863633179691624e-06, "loss": 1.2271, "step": 2067 }, { "epoch": 0.06, "learning_rate": 4.986337863984924e-06, "loss": 1.2532, "step": 2068 }, { "epoch": 0.06, "learning_rate": 4.986312386331945e-06, "loss": 1.1546, "step": 2069 }, { "epoch": 0.06, "learning_rate": 4.986286885010471e-06, "loss": 1.2103, "step": 2070 }, { "epoch": 0.06, "learning_rate": 4.986261360020742e-06, "loss": 1.1544, "step": 2071 }, { "epoch": 0.06, "learning_rate": 4.986235811363003e-06, "loss": 1.1726, "step": 2072 }, { "epoch": 0.06, "learning_rate": 4.986210239037496e-06, "loss": 1.0778, "step": 2073 }, { "epoch": 0.06, "learning_rate": 4.986184643044465e-06, "loss": 1.0168, "step": 2074 }, { "epoch": 0.06, "learning_rate": 4.986159023384154e-06, "loss": 1.1907, "step": 2075 }, { "epoch": 0.06, "learning_rate": 4.986133380056807e-06, "loss": 1.2898, "step": 2076 }, { "epoch": 0.06, "learning_rate": 4.986107713062667e-06, "loss": 1.1855, "step": 2077 }, { "epoch": 0.06, "learning_rate": 4.986082022401978e-06, "loss": 1.1355, "step": 2078 }, { "epoch": 0.06, "learning_rate": 4.986056308074987e-06, "loss": 1.1967, "step": 2079 }, { "epoch": 0.06, "learning_rate": 4.986030570081936e-06, "loss": 1.1772, "step": 2080 }, { "epoch": 0.06, "learning_rate": 4.986004808423072e-06, "loss": 1.2101, "step": 2081 }, { "epoch": 0.06, "learning_rate": 4.9859790230986396e-06, "loss": 1.0864, "step": 2082 }, { "epoch": 0.06, "learning_rate": 4.985953214108884e-06, "loss": 1.0322, "step": 2083 }, { "epoch": 0.06, "learning_rate": 4.985927381454051e-06, "loss": 1.1594, "step": 2084 }, { "epoch": 0.06, "learning_rate": 4.985901525134386e-06, "loss": 1.2071, "step": 2085 }, { "epoch": 0.06, "learning_rate": 4.985875645150137e-06, "loss": 1.2257, "step": 2086 }, { "epoch": 0.06, "learning_rate": 4.985849741501548e-06, "loss": 1.1998, "step": 2087 }, { "epoch": 0.06, "learning_rate": 4.985823814188868e-06, "loss": 1.1614, "step": 2088 }, { "epoch": 0.06, "learning_rate": 4.985797863212342e-06, "loss": 1.3022, "step": 2089 }, { "epoch": 0.06, "learning_rate": 4.985771888572216e-06, "loss": 1.0962, "step": 2090 }, { "epoch": 0.06, "learning_rate": 4.9857458902687405e-06, "loss": 1.2693, "step": 2091 }, { "epoch": 0.06, "learning_rate": 4.98571986830216e-06, "loss": 1.3082, "step": 2092 }, { "epoch": 0.06, "learning_rate": 4.985693822672725e-06, "loss": 1.138, "step": 2093 }, { "epoch": 0.06, "learning_rate": 4.985667753380681e-06, "loss": 1.2204, "step": 2094 }, { "epoch": 0.06, "learning_rate": 4.985641660426278e-06, "loss": 1.1172, "step": 2095 }, { "epoch": 0.06, "learning_rate": 4.985615543809763e-06, "loss": 1.2186, "step": 2096 }, { "epoch": 0.06, "learning_rate": 4.985589403531384e-06, "loss": 1.1763, "step": 2097 }, { "epoch": 0.06, "learning_rate": 4.985563239591394e-06, "loss": 1.2863, "step": 2098 }, { "epoch": 0.06, "learning_rate": 4.985537051990036e-06, "loss": 1.1529, "step": 2099 }, { "epoch": 0.06, "learning_rate": 4.9855108407275635e-06, "loss": 1.0938, "step": 2100 }, { "epoch": 0.06, "learning_rate": 4.985484605804225e-06, "loss": 1.1229, "step": 2101 }, { "epoch": 0.06, "learning_rate": 4.98545834722027e-06, "loss": 1.1588, "step": 2102 }, { "epoch": 0.06, "learning_rate": 4.985432064975948e-06, "loss": 1.1784, "step": 2103 }, { "epoch": 0.06, "learning_rate": 4.985405759071511e-06, "loss": 1.1328, "step": 2104 }, { "epoch": 0.06, "learning_rate": 4.985379429507206e-06, "loss": 1.1092, "step": 2105 }, { "epoch": 0.06, "learning_rate": 4.985353076283288e-06, "loss": 1.2693, "step": 2106 }, { "epoch": 0.06, "learning_rate": 4.985326699400005e-06, "loss": 1.2052, "step": 2107 }, { "epoch": 0.06, "learning_rate": 4.9853002988576085e-06, "loss": 1.123, "step": 2108 }, { "epoch": 0.06, "learning_rate": 4.985273874656351e-06, "loss": 1.1243, "step": 2109 }, { "epoch": 0.06, "learning_rate": 4.985247426796482e-06, "loss": 1.2427, "step": 2110 }, { "epoch": 0.06, "learning_rate": 4.9852209552782554e-06, "loss": 1.1003, "step": 2111 }, { "epoch": 0.06, "learning_rate": 4.985194460101922e-06, "loss": 1.1159, "step": 2112 }, { "epoch": 0.06, "learning_rate": 4.985167941267733e-06, "loss": 1.1535, "step": 2113 }, { "epoch": 0.06, "learning_rate": 4.9851413987759435e-06, "loss": 1.1869, "step": 2114 }, { "epoch": 0.06, "learning_rate": 4.985114832626805e-06, "loss": 1.2016, "step": 2115 }, { "epoch": 0.06, "learning_rate": 4.985088242820569e-06, "loss": 1.1417, "step": 2116 }, { "epoch": 0.06, "learning_rate": 4.985061629357491e-06, "loss": 1.1628, "step": 2117 }, { "epoch": 0.06, "learning_rate": 4.985034992237823e-06, "loss": 1.1791, "step": 2118 }, { "epoch": 0.06, "learning_rate": 4.985008331461817e-06, "loss": 1.1371, "step": 2119 }, { "epoch": 0.06, "learning_rate": 4.984981647029731e-06, "loss": 1.2222, "step": 2120 }, { "epoch": 0.06, "learning_rate": 4.984954938941815e-06, "loss": 1.183, "step": 2121 }, { "epoch": 0.06, "learning_rate": 4.984928207198325e-06, "loss": 1.2257, "step": 2122 }, { "epoch": 0.06, "learning_rate": 4.984901451799515e-06, "loss": 1.2455, "step": 2123 }, { "epoch": 0.06, "learning_rate": 4.98487467274564e-06, "loss": 1.1484, "step": 2124 }, { "epoch": 0.06, "learning_rate": 4.9848478700369555e-06, "loss": 1.1837, "step": 2125 }, { "epoch": 0.06, "learning_rate": 4.984821043673715e-06, "loss": 1.2218, "step": 2126 }, { "epoch": 0.06, "learning_rate": 4.984794193656176e-06, "loss": 1.1821, "step": 2127 }, { "epoch": 0.06, "learning_rate": 4.984767319984593e-06, "loss": 1.1774, "step": 2128 }, { "epoch": 0.06, "learning_rate": 4.984740422659221e-06, "loss": 1.0772, "step": 2129 }, { "epoch": 0.06, "learning_rate": 4.984713501680317e-06, "loss": 1.2188, "step": 2130 }, { "epoch": 0.06, "learning_rate": 4.984686557048137e-06, "loss": 1.2906, "step": 2131 }, { "epoch": 0.06, "learning_rate": 4.984659588762938e-06, "loss": 1.145, "step": 2132 }, { "epoch": 0.06, "learning_rate": 4.984632596824977e-06, "loss": 1.1139, "step": 2133 }, { "epoch": 0.06, "learning_rate": 4.98460558123451e-06, "loss": 1.2003, "step": 2134 }, { "epoch": 0.06, "learning_rate": 4.984578541991794e-06, "loss": 1.1884, "step": 2135 }, { "epoch": 0.06, "learning_rate": 4.9845514790970864e-06, "loss": 1.1524, "step": 2136 }, { "epoch": 0.06, "learning_rate": 4.984524392550646e-06, "loss": 1.298, "step": 2137 }, { "epoch": 0.06, "learning_rate": 4.9844972823527295e-06, "loss": 1.1504, "step": 2138 }, { "epoch": 0.06, "learning_rate": 4.984470148503596e-06, "loss": 1.1605, "step": 2139 }, { "epoch": 0.06, "learning_rate": 4.984442991003503e-06, "loss": 1.2095, "step": 2140 }, { "epoch": 0.06, "learning_rate": 4.98441580985271e-06, "loss": 1.197, "step": 2141 }, { "epoch": 0.06, "learning_rate": 4.984388605051474e-06, "loss": 1.1713, "step": 2142 }, { "epoch": 0.06, "learning_rate": 4.984361376600056e-06, "loss": 1.2595, "step": 2143 }, { "epoch": 0.06, "learning_rate": 4.984334124498714e-06, "loss": 1.2227, "step": 2144 }, { "epoch": 0.06, "learning_rate": 4.984306848747707e-06, "loss": 1.1718, "step": 2145 }, { "epoch": 0.06, "learning_rate": 4.9842795493472955e-06, "loss": 1.2222, "step": 2146 }, { "epoch": 0.06, "learning_rate": 4.984252226297739e-06, "loss": 1.1146, "step": 2147 }, { "epoch": 0.06, "learning_rate": 4.9842248795992985e-06, "loss": 1.1503, "step": 2148 }, { "epoch": 0.06, "learning_rate": 4.984197509252233e-06, "loss": 1.2391, "step": 2149 }, { "epoch": 0.06, "learning_rate": 4.984170115256803e-06, "loss": 1.3014, "step": 2150 }, { "epoch": 0.06, "learning_rate": 4.984142697613271e-06, "loss": 1.168, "step": 2151 }, { "epoch": 0.06, "learning_rate": 4.984115256321897e-06, "loss": 1.1166, "step": 2152 }, { "epoch": 0.06, "learning_rate": 4.984087791382941e-06, "loss": 1.1064, "step": 2153 }, { "epoch": 0.06, "learning_rate": 4.984060302796666e-06, "loss": 1.0186, "step": 2154 }, { "epoch": 0.06, "learning_rate": 4.984032790563334e-06, "loss": 1.1801, "step": 2155 }, { "epoch": 0.06, "learning_rate": 4.9840052546832065e-06, "loss": 1.2991, "step": 2156 }, { "epoch": 0.06, "learning_rate": 4.9839776951565445e-06, "loss": 1.1566, "step": 2157 }, { "epoch": 0.07, "learning_rate": 4.983950111983611e-06, "loss": 1.1339, "step": 2158 }, { "epoch": 0.07, "learning_rate": 4.983922505164669e-06, "loss": 1.0595, "step": 2159 }, { "epoch": 0.07, "learning_rate": 4.983894874699981e-06, "loss": 1.1186, "step": 2160 }, { "epoch": 0.07, "learning_rate": 4.98386722058981e-06, "loss": 1.0469, "step": 2161 }, { "epoch": 0.07, "learning_rate": 4.98383954283442e-06, "loss": 1.2512, "step": 2162 }, { "epoch": 0.07, "learning_rate": 4.983811841434073e-06, "loss": 1.1202, "step": 2163 }, { "epoch": 0.07, "learning_rate": 4.983784116389034e-06, "loss": 1.1533, "step": 2164 }, { "epoch": 0.07, "learning_rate": 4.983756367699566e-06, "loss": 1.1595, "step": 2165 }, { "epoch": 0.07, "learning_rate": 4.983728595365933e-06, "loss": 1.2346, "step": 2166 }, { "epoch": 0.07, "learning_rate": 4.983700799388401e-06, "loss": 1.2028, "step": 2167 }, { "epoch": 0.07, "learning_rate": 4.983672979767234e-06, "loss": 1.2991, "step": 2168 }, { "epoch": 0.07, "learning_rate": 4.983645136502696e-06, "loss": 1.1478, "step": 2169 }, { "epoch": 0.07, "learning_rate": 4.983617269595052e-06, "loss": 1.1696, "step": 2170 }, { "epoch": 0.07, "learning_rate": 4.983589379044568e-06, "loss": 1.0733, "step": 2171 }, { "epoch": 0.07, "learning_rate": 4.9835614648515095e-06, "loss": 1.1381, "step": 2172 }, { "epoch": 0.07, "learning_rate": 4.983533527016142e-06, "loss": 1.2355, "step": 2173 }, { "epoch": 0.07, "learning_rate": 4.983505565538731e-06, "loss": 1.0709, "step": 2174 }, { "epoch": 0.07, "learning_rate": 4.983477580419543e-06, "loss": 1.2024, "step": 2175 }, { "epoch": 0.07, "learning_rate": 4.983449571658845e-06, "loss": 1.0659, "step": 2176 }, { "epoch": 0.07, "learning_rate": 4.983421539256903e-06, "loss": 1.2184, "step": 2177 }, { "epoch": 0.07, "learning_rate": 4.983393483213984e-06, "loss": 1.1708, "step": 2178 }, { "epoch": 0.07, "learning_rate": 4.983365403530355e-06, "loss": 1.0844, "step": 2179 }, { "epoch": 0.07, "learning_rate": 4.9833373002062834e-06, "loss": 1.0958, "step": 2180 }, { "epoch": 0.07, "learning_rate": 4.983309173242037e-06, "loss": 1.1794, "step": 2181 }, { "epoch": 0.07, "learning_rate": 4.983281022637882e-06, "loss": 1.2211, "step": 2182 }, { "epoch": 0.07, "learning_rate": 4.983252848394089e-06, "loss": 1.179, "step": 2183 }, { "epoch": 0.07, "learning_rate": 4.983224650510925e-06, "loss": 1.1646, "step": 2184 }, { "epoch": 0.07, "learning_rate": 4.983196428988658e-06, "loss": 1.0979, "step": 2185 }, { "epoch": 0.07, "learning_rate": 4.9831681838275566e-06, "loss": 1.1389, "step": 2186 }, { "epoch": 0.07, "learning_rate": 4.98313991502789e-06, "loss": 1.1805, "step": 2187 }, { "epoch": 0.07, "learning_rate": 4.983111622589928e-06, "loss": 1.1697, "step": 2188 }, { "epoch": 0.07, "learning_rate": 4.983083306513938e-06, "loss": 1.2897, "step": 2189 }, { "epoch": 0.07, "learning_rate": 4.983054966800192e-06, "loss": 1.1979, "step": 2190 }, { "epoch": 0.07, "learning_rate": 4.983026603448958e-06, "loss": 1.2167, "step": 2191 }, { "epoch": 0.07, "learning_rate": 4.982998216460507e-06, "loss": 1.1815, "step": 2192 }, { "epoch": 0.07, "learning_rate": 4.9829698058351084e-06, "loss": 1.1493, "step": 2193 }, { "epoch": 0.07, "learning_rate": 4.9829413715730335e-06, "loss": 1.0162, "step": 2194 }, { "epoch": 0.07, "learning_rate": 4.982912913674552e-06, "loss": 1.1607, "step": 2195 }, { "epoch": 0.07, "learning_rate": 4.982884432139936e-06, "loss": 1.1155, "step": 2196 }, { "epoch": 0.07, "learning_rate": 4.982855926969456e-06, "loss": 1.1547, "step": 2197 }, { "epoch": 0.07, "learning_rate": 4.982827398163383e-06, "loss": 1.1292, "step": 2198 }, { "epoch": 0.07, "learning_rate": 4.982798845721989e-06, "loss": 1.2045, "step": 2199 }, { "epoch": 0.07, "learning_rate": 4.982770269645546e-06, "loss": 1.2064, "step": 2200 }, { "epoch": 0.07, "learning_rate": 4.982741669934326e-06, "loss": 1.1305, "step": 2201 }, { "epoch": 0.07, "learning_rate": 4.9827130465886e-06, "loss": 1.1995, "step": 2202 }, { "epoch": 0.07, "learning_rate": 4.982684399608642e-06, "loss": 1.1302, "step": 2203 }, { "epoch": 0.07, "learning_rate": 4.982655728994725e-06, "loss": 1.1677, "step": 2204 }, { "epoch": 0.07, "learning_rate": 4.98262703474712e-06, "loss": 1.1941, "step": 2205 }, { "epoch": 0.07, "learning_rate": 4.982598316866102e-06, "loss": 1.1013, "step": 2206 }, { "epoch": 0.07, "learning_rate": 4.982569575351943e-06, "loss": 1.178, "step": 2207 }, { "epoch": 0.07, "learning_rate": 4.982540810204917e-06, "loss": 1.1371, "step": 2208 }, { "epoch": 0.07, "learning_rate": 4.9825120214253e-06, "loss": 1.0938, "step": 2209 }, { "epoch": 0.07, "learning_rate": 4.982483209013363e-06, "loss": 1.0757, "step": 2210 }, { "epoch": 0.07, "learning_rate": 4.982454372969382e-06, "loss": 1.3065, "step": 2211 }, { "epoch": 0.07, "learning_rate": 4.98242551329363e-06, "loss": 1.1896, "step": 2212 }, { "epoch": 0.07, "learning_rate": 4.982396629986384e-06, "loss": 1.2227, "step": 2213 }, { "epoch": 0.07, "learning_rate": 4.9823677230479165e-06, "loss": 1.1848, "step": 2214 }, { "epoch": 0.07, "learning_rate": 4.982338792478504e-06, "loss": 1.1598, "step": 2215 }, { "epoch": 0.07, "learning_rate": 4.9823098382784215e-06, "loss": 1.1686, "step": 2216 }, { "epoch": 0.07, "learning_rate": 4.982280860447946e-06, "loss": 1.1176, "step": 2217 }, { "epoch": 0.07, "learning_rate": 4.982251858987351e-06, "loss": 1.2499, "step": 2218 }, { "epoch": 0.07, "learning_rate": 4.982222833896914e-06, "loss": 1.3091, "step": 2219 }, { "epoch": 0.07, "learning_rate": 4.9821937851769114e-06, "loss": 1.2134, "step": 2220 }, { "epoch": 0.07, "learning_rate": 4.982164712827619e-06, "loss": 1.1296, "step": 2221 }, { "epoch": 0.07, "learning_rate": 4.9821356168493154e-06, "loss": 1.0604, "step": 2222 }, { "epoch": 0.07, "learning_rate": 4.982106497242275e-06, "loss": 1.1205, "step": 2223 }, { "epoch": 0.07, "learning_rate": 4.982077354006775e-06, "loss": 1.2728, "step": 2224 }, { "epoch": 0.07, "learning_rate": 4.9820481871430955e-06, "loss": 1.1606, "step": 2225 }, { "epoch": 0.07, "learning_rate": 4.982018996651513e-06, "loss": 1.126, "step": 2226 }, { "epoch": 0.07, "learning_rate": 4.981989782532305e-06, "loss": 1.1188, "step": 2227 }, { "epoch": 0.07, "learning_rate": 4.981960544785749e-06, "loss": 1.1991, "step": 2228 }, { "epoch": 0.07, "learning_rate": 4.981931283412124e-06, "loss": 1.1779, "step": 2229 }, { "epoch": 0.07, "learning_rate": 4.981901998411708e-06, "loss": 1.1218, "step": 2230 }, { "epoch": 0.07, "learning_rate": 4.981872689784781e-06, "loss": 1.251, "step": 2231 }, { "epoch": 0.07, "learning_rate": 4.9818433575316215e-06, "loss": 1.1664, "step": 2232 }, { "epoch": 0.07, "learning_rate": 4.981814001652508e-06, "loss": 1.2229, "step": 2233 }, { "epoch": 0.07, "learning_rate": 4.981784622147721e-06, "loss": 1.0662, "step": 2234 }, { "epoch": 0.07, "learning_rate": 4.981755219017539e-06, "loss": 1.1852, "step": 2235 }, { "epoch": 0.07, "learning_rate": 4.981725792262243e-06, "loss": 1.1641, "step": 2236 }, { "epoch": 0.07, "learning_rate": 4.981696341882113e-06, "loss": 1.2478, "step": 2237 }, { "epoch": 0.07, "learning_rate": 4.981666867877429e-06, "loss": 1.142, "step": 2238 }, { "epoch": 0.07, "learning_rate": 4.981637370248471e-06, "loss": 1.1741, "step": 2239 }, { "epoch": 0.07, "learning_rate": 4.981607848995521e-06, "loss": 1.1471, "step": 2240 }, { "epoch": 0.07, "learning_rate": 4.981578304118859e-06, "loss": 1.1365, "step": 2241 }, { "epoch": 0.07, "learning_rate": 4.981548735618767e-06, "loss": 1.1511, "step": 2242 }, { "epoch": 0.07, "learning_rate": 4.981519143495526e-06, "loss": 1.1849, "step": 2243 }, { "epoch": 0.07, "learning_rate": 4.981489527749418e-06, "loss": 1.1671, "step": 2244 }, { "epoch": 0.07, "learning_rate": 4.981459888380725e-06, "loss": 1.0894, "step": 2245 }, { "epoch": 0.07, "learning_rate": 4.981430225389729e-06, "loss": 1.0164, "step": 2246 }, { "epoch": 0.07, "learning_rate": 4.981400538776713e-06, "loss": 1.1099, "step": 2247 }, { "epoch": 0.07, "learning_rate": 4.981370828541957e-06, "loss": 1.2375, "step": 2248 }, { "epoch": 0.07, "learning_rate": 4.981341094685747e-06, "loss": 0.9931, "step": 2249 }, { "epoch": 0.07, "learning_rate": 4.981311337208365e-06, "loss": 1.1268, "step": 2250 }, { "epoch": 0.07, "learning_rate": 4.981281556110094e-06, "loss": 1.1611, "step": 2251 }, { "epoch": 0.07, "learning_rate": 4.9812517513912175e-06, "loss": 1.1666, "step": 2252 }, { "epoch": 0.07, "learning_rate": 4.9812219230520195e-06, "loss": 1.1737, "step": 2253 }, { "epoch": 0.07, "learning_rate": 4.981192071092783e-06, "loss": 1.1603, "step": 2254 }, { "epoch": 0.07, "learning_rate": 4.981162195513794e-06, "loss": 1.2158, "step": 2255 }, { "epoch": 0.07, "learning_rate": 4.981132296315335e-06, "loss": 1.0555, "step": 2256 }, { "epoch": 0.07, "learning_rate": 4.9811023734976925e-06, "loss": 1.236, "step": 2257 }, { "epoch": 0.07, "learning_rate": 4.9810724270611495e-06, "loss": 1.0659, "step": 2258 }, { "epoch": 0.07, "learning_rate": 4.981042457005992e-06, "loss": 1.1522, "step": 2259 }, { "epoch": 0.07, "learning_rate": 4.9810124633325056e-06, "loss": 1.0778, "step": 2260 }, { "epoch": 0.07, "learning_rate": 4.980982446040975e-06, "loss": 1.1776, "step": 2261 }, { "epoch": 0.07, "learning_rate": 4.980952405131687e-06, "loss": 1.3334, "step": 2262 }, { "epoch": 0.07, "learning_rate": 4.9809223406049265e-06, "loss": 1.2162, "step": 2263 }, { "epoch": 0.07, "learning_rate": 4.98089225246098e-06, "loss": 1.0953, "step": 2264 }, { "epoch": 0.07, "learning_rate": 4.980862140700135e-06, "loss": 1.1263, "step": 2265 }, { "epoch": 0.07, "learning_rate": 4.980832005322677e-06, "loss": 1.2361, "step": 2266 }, { "epoch": 0.07, "learning_rate": 4.980801846328892e-06, "loss": 1.173, "step": 2267 }, { "epoch": 0.07, "learning_rate": 4.980771663719069e-06, "loss": 1.079, "step": 2268 }, { "epoch": 0.07, "learning_rate": 4.9807414574934945e-06, "loss": 1.1881, "step": 2269 }, { "epoch": 0.07, "learning_rate": 4.980711227652456e-06, "loss": 1.2231, "step": 2270 }, { "epoch": 0.07, "learning_rate": 4.980680974196242e-06, "loss": 1.0372, "step": 2271 }, { "epoch": 0.07, "learning_rate": 4.980650697125139e-06, "loss": 1.088, "step": 2272 }, { "epoch": 0.07, "learning_rate": 4.9806203964394366e-06, "loss": 1.2313, "step": 2273 }, { "epoch": 0.07, "learning_rate": 4.980590072139423e-06, "loss": 1.1939, "step": 2274 }, { "epoch": 0.07, "learning_rate": 4.9805597242253855e-06, "loss": 1.1375, "step": 2275 }, { "epoch": 0.07, "learning_rate": 4.980529352697615e-06, "loss": 1.234, "step": 2276 }, { "epoch": 0.07, "learning_rate": 4.980498957556399e-06, "loss": 1.1048, "step": 2277 }, { "epoch": 0.07, "learning_rate": 4.980468538802028e-06, "loss": 1.032, "step": 2278 }, { "epoch": 0.07, "learning_rate": 4.980438096434792e-06, "loss": 1.1368, "step": 2279 }, { "epoch": 0.07, "learning_rate": 4.980407630454978e-06, "loss": 1.131, "step": 2280 }, { "epoch": 0.07, "learning_rate": 4.9803771408628795e-06, "loss": 1.1523, "step": 2281 }, { "epoch": 0.07, "learning_rate": 4.980346627658785e-06, "loss": 1.0834, "step": 2282 }, { "epoch": 0.07, "learning_rate": 4.980316090842985e-06, "loss": 1.1167, "step": 2283 }, { "epoch": 0.07, "learning_rate": 4.9802855304157714e-06, "loss": 1.2216, "step": 2284 }, { "epoch": 0.07, "learning_rate": 4.980254946377432e-06, "loss": 1.1779, "step": 2285 }, { "epoch": 0.07, "learning_rate": 4.980224338728261e-06, "loss": 1.1528, "step": 2286 }, { "epoch": 0.07, "learning_rate": 4.980193707468549e-06, "loss": 1.2634, "step": 2287 }, { "epoch": 0.07, "learning_rate": 4.980163052598588e-06, "loss": 1.0626, "step": 2288 }, { "epoch": 0.07, "learning_rate": 4.980132374118668e-06, "loss": 1.2542, "step": 2289 }, { "epoch": 0.07, "learning_rate": 4.980101672029084e-06, "loss": 1.2521, "step": 2290 }, { "epoch": 0.07, "learning_rate": 4.9800709463301246e-06, "loss": 1.2335, "step": 2291 }, { "epoch": 0.07, "learning_rate": 4.980040197022085e-06, "loss": 1.1328, "step": 2292 }, { "epoch": 0.07, "learning_rate": 4.9800094241052575e-06, "loss": 1.2114, "step": 2293 }, { "epoch": 0.07, "learning_rate": 4.979978627579934e-06, "loss": 1.1594, "step": 2294 }, { "epoch": 0.07, "learning_rate": 4.979947807446409e-06, "loss": 1.1752, "step": 2295 }, { "epoch": 0.07, "learning_rate": 4.979916963704975e-06, "loss": 1.137, "step": 2296 }, { "epoch": 0.07, "learning_rate": 4.979886096355926e-06, "loss": 1.1866, "step": 2297 }, { "epoch": 0.07, "learning_rate": 4.979855205399555e-06, "loss": 1.1406, "step": 2298 }, { "epoch": 0.07, "learning_rate": 4.979824290836158e-06, "loss": 1.165, "step": 2299 }, { "epoch": 0.07, "learning_rate": 4.979793352666027e-06, "loss": 1.1973, "step": 2300 }, { "epoch": 0.07, "learning_rate": 4.979762390889459e-06, "loss": 1.274, "step": 2301 }, { "epoch": 0.07, "learning_rate": 4.979731405506746e-06, "loss": 1.1204, "step": 2302 }, { "epoch": 0.07, "learning_rate": 4.979700396518184e-06, "loss": 1.156, "step": 2303 }, { "epoch": 0.07, "learning_rate": 4.97966936392407e-06, "loss": 1.0836, "step": 2304 }, { "epoch": 0.07, "learning_rate": 4.979638307724697e-06, "loss": 1.1205, "step": 2305 }, { "epoch": 0.07, "learning_rate": 4.979607227920361e-06, "loss": 1.1871, "step": 2306 }, { "epoch": 0.07, "learning_rate": 4.97957612451136e-06, "loss": 1.1699, "step": 2307 }, { "epoch": 0.07, "learning_rate": 4.979544997497987e-06, "loss": 1.1917, "step": 2308 }, { "epoch": 0.07, "learning_rate": 4.979513846880541e-06, "loss": 1.1547, "step": 2309 }, { "epoch": 0.07, "learning_rate": 4.979482672659316e-06, "loss": 1.1471, "step": 2310 }, { "epoch": 0.07, "learning_rate": 4.97945147483461e-06, "loss": 1.0533, "step": 2311 }, { "epoch": 0.07, "learning_rate": 4.979420253406721e-06, "loss": 1.2097, "step": 2312 }, { "epoch": 0.07, "learning_rate": 4.9793890083759455e-06, "loss": 1.1167, "step": 2313 }, { "epoch": 0.07, "learning_rate": 4.9793577397425805e-06, "loss": 1.1902, "step": 2314 }, { "epoch": 0.07, "learning_rate": 4.979326447506924e-06, "loss": 1.2245, "step": 2315 }, { "epoch": 0.07, "learning_rate": 4.979295131669274e-06, "loss": 1.1899, "step": 2316 }, { "epoch": 0.07, "learning_rate": 4.979263792229928e-06, "loss": 1.1754, "step": 2317 }, { "epoch": 0.07, "learning_rate": 4.979232429189184e-06, "loss": 1.2415, "step": 2318 }, { "epoch": 0.07, "learning_rate": 4.979201042547342e-06, "loss": 1.1138, "step": 2319 }, { "epoch": 0.07, "learning_rate": 4.979169632304701e-06, "loss": 1.1331, "step": 2320 }, { "epoch": 0.07, "learning_rate": 4.979138198461559e-06, "loss": 1.1368, "step": 2321 }, { "epoch": 0.07, "learning_rate": 4.979106741018214e-06, "loss": 1.1993, "step": 2322 }, { "epoch": 0.07, "learning_rate": 4.979075259974968e-06, "loss": 1.1702, "step": 2323 }, { "epoch": 0.07, "learning_rate": 4.979043755332119e-06, "loss": 1.213, "step": 2324 }, { "epoch": 0.07, "learning_rate": 4.979012227089967e-06, "loss": 1.1058, "step": 2325 }, { "epoch": 0.07, "learning_rate": 4.978980675248814e-06, "loss": 1.1371, "step": 2326 }, { "epoch": 0.07, "learning_rate": 4.978949099808957e-06, "loss": 1.1645, "step": 2327 }, { "epoch": 0.07, "learning_rate": 4.9789175007706994e-06, "loss": 1.2356, "step": 2328 }, { "epoch": 0.07, "learning_rate": 4.978885878134341e-06, "loss": 1.1613, "step": 2329 }, { "epoch": 0.07, "learning_rate": 4.978854231900183e-06, "loss": 1.2551, "step": 2330 }, { "epoch": 0.07, "learning_rate": 4.978822562068526e-06, "loss": 1.1619, "step": 2331 }, { "epoch": 0.07, "learning_rate": 4.978790868639673e-06, "loss": 1.0833, "step": 2332 }, { "epoch": 0.07, "learning_rate": 4.978759151613925e-06, "loss": 1.1229, "step": 2333 }, { "epoch": 0.07, "learning_rate": 4.978727410991582e-06, "loss": 1.1117, "step": 2334 }, { "epoch": 0.07, "learning_rate": 4.978695646772949e-06, "loss": 1.0671, "step": 2335 }, { "epoch": 0.07, "learning_rate": 4.9786638589583266e-06, "loss": 1.0976, "step": 2336 }, { "epoch": 0.07, "learning_rate": 4.978632047548018e-06, "loss": 1.2671, "step": 2337 }, { "epoch": 0.07, "learning_rate": 4.978600212542327e-06, "loss": 1.0799, "step": 2338 }, { "epoch": 0.07, "learning_rate": 4.978568353941555e-06, "loss": 1.1379, "step": 2339 }, { "epoch": 0.07, "learning_rate": 4.978536471746007e-06, "loss": 1.1131, "step": 2340 }, { "epoch": 0.07, "learning_rate": 4.978504565955985e-06, "loss": 1.1287, "step": 2341 }, { "epoch": 0.07, "learning_rate": 4.978472636571793e-06, "loss": 1.2994, "step": 2342 }, { "epoch": 0.07, "learning_rate": 4.978440683593735e-06, "loss": 1.1185, "step": 2343 }, { "epoch": 0.07, "learning_rate": 4.978408707022115e-06, "loss": 1.1789, "step": 2344 }, { "epoch": 0.07, "learning_rate": 4.9783767068572385e-06, "loss": 1.0994, "step": 2345 }, { "epoch": 0.07, "learning_rate": 4.9783446830994085e-06, "loss": 1.2245, "step": 2346 }, { "epoch": 0.07, "learning_rate": 4.978312635748932e-06, "loss": 1.1163, "step": 2347 }, { "epoch": 0.07, "learning_rate": 4.9782805648061116e-06, "loss": 1.1753, "step": 2348 }, { "epoch": 0.07, "learning_rate": 4.9782484702712546e-06, "loss": 1.1606, "step": 2349 }, { "epoch": 0.07, "learning_rate": 4.978216352144666e-06, "loss": 1.0797, "step": 2350 }, { "epoch": 0.07, "learning_rate": 4.97818421042665e-06, "loss": 1.0815, "step": 2351 }, { "epoch": 0.07, "learning_rate": 4.9781520451175144e-06, "loss": 1.1744, "step": 2352 }, { "epoch": 0.07, "learning_rate": 4.978119856217565e-06, "loss": 1.2491, "step": 2353 }, { "epoch": 0.07, "learning_rate": 4.978087643727108e-06, "loss": 1.0422, "step": 2354 }, { "epoch": 0.07, "learning_rate": 4.978055407646451e-06, "loss": 1.111, "step": 2355 }, { "epoch": 0.07, "learning_rate": 4.978023147975899e-06, "loss": 1.1661, "step": 2356 }, { "epoch": 0.07, "learning_rate": 4.97799086471576e-06, "loss": 1.2323, "step": 2357 }, { "epoch": 0.07, "learning_rate": 4.977958557866342e-06, "loss": 1.2089, "step": 2358 }, { "epoch": 0.07, "learning_rate": 4.977926227427951e-06, "loss": 1.1785, "step": 2359 }, { "epoch": 0.07, "learning_rate": 4.977893873400898e-06, "loss": 1.2303, "step": 2360 }, { "epoch": 0.07, "learning_rate": 4.977861495785487e-06, "loss": 1.067, "step": 2361 }, { "epoch": 0.07, "learning_rate": 4.9778290945820276e-06, "loss": 1.2122, "step": 2362 }, { "epoch": 0.07, "learning_rate": 4.977796669790829e-06, "loss": 1.1307, "step": 2363 }, { "epoch": 0.07, "learning_rate": 4.977764221412199e-06, "loss": 1.2812, "step": 2364 }, { "epoch": 0.07, "learning_rate": 4.977731749446448e-06, "loss": 1.1005, "step": 2365 }, { "epoch": 0.07, "learning_rate": 4.977699253893883e-06, "loss": 1.1333, "step": 2366 }, { "epoch": 0.07, "learning_rate": 4.977666734754814e-06, "loss": 1.1681, "step": 2367 }, { "epoch": 0.07, "learning_rate": 4.977634192029553e-06, "loss": 1.1792, "step": 2368 }, { "epoch": 0.07, "learning_rate": 4.977601625718407e-06, "loss": 1.1215, "step": 2369 }, { "epoch": 0.07, "learning_rate": 4.977569035821686e-06, "loss": 1.1732, "step": 2370 }, { "epoch": 0.07, "learning_rate": 4.977536422339701e-06, "loss": 1.1243, "step": 2371 }, { "epoch": 0.07, "learning_rate": 4.977503785272764e-06, "loss": 1.2002, "step": 2372 }, { "epoch": 0.07, "learning_rate": 4.977471124621183e-06, "loss": 1.0992, "step": 2373 }, { "epoch": 0.07, "learning_rate": 4.977438440385269e-06, "loss": 1.1509, "step": 2374 }, { "epoch": 0.07, "learning_rate": 4.977405732565336e-06, "loss": 1.1221, "step": 2375 }, { "epoch": 0.07, "learning_rate": 4.9773730011616924e-06, "loss": 1.2218, "step": 2376 }, { "epoch": 0.07, "learning_rate": 4.9773402461746525e-06, "loss": 1.1924, "step": 2377 }, { "epoch": 0.07, "learning_rate": 4.9773074676045256e-06, "loss": 1.1934, "step": 2378 }, { "epoch": 0.07, "learning_rate": 4.977274665451625e-06, "loss": 1.2609, "step": 2379 }, { "epoch": 0.07, "learning_rate": 4.9772418397162614e-06, "loss": 1.2697, "step": 2380 }, { "epoch": 0.07, "learning_rate": 4.977208990398749e-06, "loss": 1.2703, "step": 2381 }, { "epoch": 0.07, "learning_rate": 4.977176117499401e-06, "loss": 1.106, "step": 2382 }, { "epoch": 0.07, "learning_rate": 4.97714322101853e-06, "loss": 1.1057, "step": 2383 }, { "epoch": 0.07, "learning_rate": 4.977110300956447e-06, "loss": 1.1178, "step": 2384 }, { "epoch": 0.07, "learning_rate": 4.9770773573134675e-06, "loss": 1.1903, "step": 2385 }, { "epoch": 0.07, "learning_rate": 4.977044390089905e-06, "loss": 1.1535, "step": 2386 }, { "epoch": 0.07, "learning_rate": 4.977011399286072e-06, "loss": 1.2194, "step": 2387 }, { "epoch": 0.07, "learning_rate": 4.976978384902284e-06, "loss": 1.1818, "step": 2388 }, { "epoch": 0.07, "learning_rate": 4.976945346938855e-06, "loss": 1.1967, "step": 2389 }, { "epoch": 0.07, "learning_rate": 4.976912285396099e-06, "loss": 1.1846, "step": 2390 }, { "epoch": 0.07, "learning_rate": 4.976879200274332e-06, "loss": 1.1074, "step": 2391 }, { "epoch": 0.07, "learning_rate": 4.976846091573866e-06, "loss": 1.1339, "step": 2392 }, { "epoch": 0.07, "learning_rate": 4.9768129592950195e-06, "loss": 1.2009, "step": 2393 }, { "epoch": 0.07, "learning_rate": 4.976779803438106e-06, "loss": 1.1778, "step": 2394 }, { "epoch": 0.07, "learning_rate": 4.976746624003441e-06, "loss": 1.2021, "step": 2395 }, { "epoch": 0.07, "learning_rate": 4.976713420991341e-06, "loss": 1.1251, "step": 2396 }, { "epoch": 0.07, "learning_rate": 4.976680194402124e-06, "loss": 1.1, "step": 2397 }, { "epoch": 0.07, "learning_rate": 4.976646944236102e-06, "loss": 1.1834, "step": 2398 }, { "epoch": 0.07, "learning_rate": 4.9766136704935955e-06, "loss": 1.2394, "step": 2399 }, { "epoch": 0.07, "learning_rate": 4.976580373174919e-06, "loss": 1.1287, "step": 2400 }, { "epoch": 0.07, "learning_rate": 4.97654705228039e-06, "loss": 1.1708, "step": 2401 }, { "epoch": 0.07, "learning_rate": 4.976513707810326e-06, "loss": 1.0304, "step": 2402 }, { "epoch": 0.07, "learning_rate": 4.976480339765044e-06, "loss": 1.1447, "step": 2403 }, { "epoch": 0.07, "learning_rate": 4.976446948144862e-06, "loss": 1.2693, "step": 2404 }, { "epoch": 0.07, "learning_rate": 4.976413532950098e-06, "loss": 1.2212, "step": 2405 }, { "epoch": 0.07, "learning_rate": 4.976380094181069e-06, "loss": 1.2423, "step": 2406 }, { "epoch": 0.07, "learning_rate": 4.9763466318380954e-06, "loss": 1.0923, "step": 2407 }, { "epoch": 0.07, "learning_rate": 4.976313145921494e-06, "loss": 1.2371, "step": 2408 }, { "epoch": 0.07, "learning_rate": 4.976279636431583e-06, "loss": 1.165, "step": 2409 }, { "epoch": 0.07, "learning_rate": 4.976246103368685e-06, "loss": 1.255, "step": 2410 }, { "epoch": 0.07, "learning_rate": 4.976212546733115e-06, "loss": 1.3843, "step": 2411 }, { "epoch": 0.07, "learning_rate": 4.9761789665251935e-06, "loss": 1.1589, "step": 2412 }, { "epoch": 0.07, "learning_rate": 4.976145362745241e-06, "loss": 1.1118, "step": 2413 }, { "epoch": 0.07, "learning_rate": 4.9761117353935785e-06, "loss": 1.1894, "step": 2414 }, { "epoch": 0.07, "learning_rate": 4.9760780844705245e-06, "loss": 1.1779, "step": 2415 }, { "epoch": 0.07, "learning_rate": 4.976044409976399e-06, "loss": 1.0919, "step": 2416 }, { "epoch": 0.07, "learning_rate": 4.976010711911523e-06, "loss": 1.2932, "step": 2417 }, { "epoch": 0.07, "learning_rate": 4.975976990276219e-06, "loss": 1.2516, "step": 2418 }, { "epoch": 0.07, "learning_rate": 4.975943245070805e-06, "loss": 1.0366, "step": 2419 }, { "epoch": 0.07, "learning_rate": 4.9759094762956045e-06, "loss": 1.1572, "step": 2420 }, { "epoch": 0.07, "learning_rate": 4.975875683950938e-06, "loss": 1.0662, "step": 2421 }, { "epoch": 0.07, "learning_rate": 4.975841868037128e-06, "loss": 1.1621, "step": 2422 }, { "epoch": 0.07, "learning_rate": 4.9758080285544955e-06, "loss": 1.1382, "step": 2423 }, { "epoch": 0.07, "learning_rate": 4.975774165503362e-06, "loss": 1.2424, "step": 2424 }, { "epoch": 0.07, "learning_rate": 4.975740278884051e-06, "loss": 1.1293, "step": 2425 }, { "epoch": 0.07, "learning_rate": 4.975706368696886e-06, "loss": 1.1731, "step": 2426 }, { "epoch": 0.07, "learning_rate": 4.975672434942188e-06, "loss": 1.134, "step": 2427 }, { "epoch": 0.07, "learning_rate": 4.975638477620281e-06, "loss": 1.1519, "step": 2428 }, { "epoch": 0.07, "learning_rate": 4.975604496731488e-06, "loss": 1.2087, "step": 2429 }, { "epoch": 0.07, "learning_rate": 4.975570492276133e-06, "loss": 1.2567, "step": 2430 }, { "epoch": 0.07, "learning_rate": 4.975536464254538e-06, "loss": 1.1942, "step": 2431 }, { "epoch": 0.07, "learning_rate": 4.975502412667029e-06, "loss": 1.0864, "step": 2432 }, { "epoch": 0.07, "learning_rate": 4.975468337513929e-06, "loss": 1.1124, "step": 2433 }, { "epoch": 0.07, "learning_rate": 4.975434238795563e-06, "loss": 1.0667, "step": 2434 }, { "epoch": 0.07, "learning_rate": 4.975400116512255e-06, "loss": 1.1107, "step": 2435 }, { "epoch": 0.07, "learning_rate": 4.975365970664329e-06, "loss": 1.1589, "step": 2436 }, { "epoch": 0.07, "learning_rate": 4.975331801252113e-06, "loss": 1.2238, "step": 2437 }, { "epoch": 0.07, "learning_rate": 4.975297608275929e-06, "loss": 1.176, "step": 2438 }, { "epoch": 0.07, "learning_rate": 4.975263391736104e-06, "loss": 1.1591, "step": 2439 }, { "epoch": 0.07, "learning_rate": 4.975229151632965e-06, "loss": 1.1592, "step": 2440 }, { "epoch": 0.07, "learning_rate": 4.975194887966835e-06, "loss": 1.153, "step": 2441 }, { "epoch": 0.07, "learning_rate": 4.975160600738042e-06, "loss": 1.1093, "step": 2442 }, { "epoch": 0.07, "learning_rate": 4.975126289946913e-06, "loss": 1.2509, "step": 2443 }, { "epoch": 0.07, "learning_rate": 4.975091955593773e-06, "loss": 1.1122, "step": 2444 }, { "epoch": 0.07, "learning_rate": 4.9750575976789505e-06, "loss": 1.1119, "step": 2445 }, { "epoch": 0.07, "learning_rate": 4.975023216202771e-06, "loss": 1.0353, "step": 2446 }, { "epoch": 0.07, "learning_rate": 4.974988811165563e-06, "loss": 1.1084, "step": 2447 }, { "epoch": 0.07, "learning_rate": 4.974954382567652e-06, "loss": 1.1622, "step": 2448 }, { "epoch": 0.07, "learning_rate": 4.974919930409369e-06, "loss": 1.1669, "step": 2449 }, { "epoch": 0.07, "learning_rate": 4.9748854546910395e-06, "loss": 1.0735, "step": 2450 }, { "epoch": 0.07, "learning_rate": 4.9748509554129934e-06, "loss": 1.241, "step": 2451 }, { "epoch": 0.07, "learning_rate": 4.974816432575557e-06, "loss": 1.157, "step": 2452 }, { "epoch": 0.07, "learning_rate": 4.97478188617906e-06, "loss": 1.1154, "step": 2453 }, { "epoch": 0.07, "learning_rate": 4.974747316223832e-06, "loss": 1.2094, "step": 2454 }, { "epoch": 0.07, "learning_rate": 4.974712722710201e-06, "loss": 1.1556, "step": 2455 }, { "epoch": 0.07, "learning_rate": 4.974678105638497e-06, "loss": 1.1713, "step": 2456 }, { "epoch": 0.07, "learning_rate": 4.974643465009049e-06, "loss": 1.1448, "step": 2457 }, { "epoch": 0.07, "learning_rate": 4.974608800822187e-06, "loss": 1.1714, "step": 2458 }, { "epoch": 0.07, "learning_rate": 4.974574113078242e-06, "loss": 1.2101, "step": 2459 }, { "epoch": 0.07, "learning_rate": 4.974539401777542e-06, "loss": 1.0562, "step": 2460 }, { "epoch": 0.07, "learning_rate": 4.974504666920419e-06, "loss": 1.2665, "step": 2461 }, { "epoch": 0.07, "learning_rate": 4.974469908507204e-06, "loss": 1.1498, "step": 2462 }, { "epoch": 0.07, "learning_rate": 4.974435126538227e-06, "loss": 1.092, "step": 2463 }, { "epoch": 0.07, "learning_rate": 4.9744003210138185e-06, "loss": 1.1398, "step": 2464 }, { "epoch": 0.07, "learning_rate": 4.974365491934312e-06, "loss": 1.1497, "step": 2465 }, { "epoch": 0.07, "learning_rate": 4.974330639300036e-06, "loss": 1.1255, "step": 2466 }, { "epoch": 0.07, "learning_rate": 4.9742957631113255e-06, "loss": 1.2872, "step": 2467 }, { "epoch": 0.07, "learning_rate": 4.97426086336851e-06, "loss": 1.2933, "step": 2468 }, { "epoch": 0.07, "learning_rate": 4.9742259400719235e-06, "loss": 1.1274, "step": 2469 }, { "epoch": 0.07, "learning_rate": 4.974190993221897e-06, "loss": 1.1566, "step": 2470 }, { "epoch": 0.07, "learning_rate": 4.974156022818765e-06, "loss": 1.1383, "step": 2471 }, { "epoch": 0.07, "learning_rate": 4.974121028862858e-06, "loss": 1.1602, "step": 2472 }, { "epoch": 0.07, "learning_rate": 4.974086011354511e-06, "loss": 1.1967, "step": 2473 }, { "epoch": 0.07, "learning_rate": 4.974050970294056e-06, "loss": 1.1019, "step": 2474 }, { "epoch": 0.07, "learning_rate": 4.974015905681828e-06, "loss": 1.1178, "step": 2475 }, { "epoch": 0.07, "learning_rate": 4.97398081751816e-06, "loss": 1.1069, "step": 2476 }, { "epoch": 0.07, "learning_rate": 4.973945705803385e-06, "loss": 1.1702, "step": 2477 }, { "epoch": 0.07, "learning_rate": 4.9739105705378405e-06, "loss": 1.1865, "step": 2478 }, { "epoch": 0.07, "learning_rate": 4.973875411721858e-06, "loss": 1.1039, "step": 2479 }, { "epoch": 0.07, "learning_rate": 4.973840229355772e-06, "loss": 1.2833, "step": 2480 }, { "epoch": 0.07, "learning_rate": 4.973805023439919e-06, "loss": 1.1337, "step": 2481 }, { "epoch": 0.07, "learning_rate": 4.973769793974634e-06, "loss": 1.2246, "step": 2482 }, { "epoch": 0.07, "learning_rate": 4.973734540960252e-06, "loss": 1.0942, "step": 2483 }, { "epoch": 0.07, "learning_rate": 4.973699264397109e-06, "loss": 1.1484, "step": 2484 }, { "epoch": 0.07, "learning_rate": 4.97366396428554e-06, "loss": 1.1165, "step": 2485 }, { "epoch": 0.07, "learning_rate": 4.973628640625881e-06, "loss": 1.2441, "step": 2486 }, { "epoch": 0.07, "learning_rate": 4.973593293418469e-06, "loss": 1.1199, "step": 2487 }, { "epoch": 0.07, "learning_rate": 4.97355792266364e-06, "loss": 1.1995, "step": 2488 }, { "epoch": 0.07, "learning_rate": 4.973522528361731e-06, "loss": 1.2446, "step": 2489 }, { "epoch": 0.08, "learning_rate": 4.973487110513079e-06, "loss": 1.1167, "step": 2490 }, { "epoch": 0.08, "learning_rate": 4.97345166911802e-06, "loss": 1.1309, "step": 2491 }, { "epoch": 0.08, "learning_rate": 4.973416204176893e-06, "loss": 1.2407, "step": 2492 }, { "epoch": 0.08, "learning_rate": 4.973380715690036e-06, "loss": 1.1092, "step": 2493 }, { "epoch": 0.08, "learning_rate": 4.973345203657785e-06, "loss": 1.1184, "step": 2494 }, { "epoch": 0.08, "learning_rate": 4.9733096680804785e-06, "loss": 1.1964, "step": 2495 }, { "epoch": 0.08, "learning_rate": 4.973274108958455e-06, "loss": 1.2279, "step": 2496 }, { "epoch": 0.08, "learning_rate": 4.973238526292054e-06, "loss": 1.1384, "step": 2497 }, { "epoch": 0.08, "learning_rate": 4.973202920081612e-06, "loss": 1.1202, "step": 2498 }, { "epoch": 0.08, "learning_rate": 4.973167290327471e-06, "loss": 1.1771, "step": 2499 }, { "epoch": 0.08, "learning_rate": 4.973131637029967e-06, "loss": 1.2191, "step": 2500 }, { "epoch": 0.08, "learning_rate": 4.973095960189443e-06, "loss": 1.0993, "step": 2501 }, { "epoch": 0.08, "learning_rate": 4.9730602598062346e-06, "loss": 1.1334, "step": 2502 }, { "epoch": 0.08, "learning_rate": 4.973024535880684e-06, "loss": 1.0573, "step": 2503 }, { "epoch": 0.08, "learning_rate": 4.972988788413131e-06, "loss": 1.2072, "step": 2504 }, { "epoch": 0.08, "learning_rate": 4.972953017403917e-06, "loss": 1.1862, "step": 2505 }, { "epoch": 0.08, "learning_rate": 4.972917222853379e-06, "loss": 1.1123, "step": 2506 }, { "epoch": 0.08, "learning_rate": 4.972881404761861e-06, "loss": 1.1371, "step": 2507 }, { "epoch": 0.08, "learning_rate": 4.972845563129704e-06, "loss": 1.1373, "step": 2508 }, { "epoch": 0.08, "learning_rate": 4.972809697957247e-06, "loss": 1.0532, "step": 2509 }, { "epoch": 0.08, "learning_rate": 4.972773809244833e-06, "loss": 1.0837, "step": 2510 }, { "epoch": 0.08, "learning_rate": 4.972737896992804e-06, "loss": 1.2242, "step": 2511 }, { "epoch": 0.08, "learning_rate": 4.9727019612015e-06, "loss": 1.2007, "step": 2512 }, { "epoch": 0.08, "learning_rate": 4.9726660018712645e-06, "loss": 1.1073, "step": 2513 }, { "epoch": 0.08, "learning_rate": 4.9726300190024405e-06, "loss": 1.2397, "step": 2514 }, { "epoch": 0.08, "learning_rate": 4.972594012595369e-06, "loss": 1.1414, "step": 2515 }, { "epoch": 0.08, "learning_rate": 4.9725579826503924e-06, "loss": 1.1888, "step": 2516 }, { "epoch": 0.08, "learning_rate": 4.972521929167855e-06, "loss": 1.1206, "step": 2517 }, { "epoch": 0.08, "learning_rate": 4.9724858521481005e-06, "loss": 1.1288, "step": 2518 }, { "epoch": 0.08, "learning_rate": 4.972449751591471e-06, "loss": 1.0701, "step": 2519 }, { "epoch": 0.08, "learning_rate": 4.972413627498311e-06, "loss": 1.0913, "step": 2520 }, { "epoch": 0.08, "learning_rate": 4.972377479868963e-06, "loss": 1.2262, "step": 2521 }, { "epoch": 0.08, "learning_rate": 4.972341308703773e-06, "loss": 1.2351, "step": 2522 }, { "epoch": 0.08, "learning_rate": 4.972305114003084e-06, "loss": 1.1095, "step": 2523 }, { "epoch": 0.08, "learning_rate": 4.972268895767242e-06, "loss": 1.3137, "step": 2524 }, { "epoch": 0.08, "learning_rate": 4.9722326539965895e-06, "loss": 1.3156, "step": 2525 }, { "epoch": 0.08, "learning_rate": 4.972196388691473e-06, "loss": 1.1651, "step": 2526 }, { "epoch": 0.08, "learning_rate": 4.972160099852238e-06, "loss": 1.2574, "step": 2527 }, { "epoch": 0.08, "learning_rate": 4.9721237874792294e-06, "loss": 1.2234, "step": 2528 }, { "epoch": 0.08, "learning_rate": 4.972087451572793e-06, "loss": 1.1858, "step": 2529 }, { "epoch": 0.08, "learning_rate": 4.972051092133274e-06, "loss": 1.1736, "step": 2530 }, { "epoch": 0.08, "learning_rate": 4.972014709161021e-06, "loss": 1.3253, "step": 2531 }, { "epoch": 0.08, "learning_rate": 4.971978302656377e-06, "loss": 1.1191, "step": 2532 }, { "epoch": 0.08, "learning_rate": 4.97194187261969e-06, "loss": 1.1828, "step": 2533 }, { "epoch": 0.08, "learning_rate": 4.971905419051307e-06, "loss": 1.1091, "step": 2534 }, { "epoch": 0.08, "learning_rate": 4.971868941951575e-06, "loss": 1.0854, "step": 2535 }, { "epoch": 0.08, "learning_rate": 4.9718324413208415e-06, "loss": 1.1924, "step": 2536 }, { "epoch": 0.08, "learning_rate": 4.971795917159454e-06, "loss": 1.1523, "step": 2537 }, { "epoch": 0.08, "learning_rate": 4.971759369467759e-06, "loss": 1.1993, "step": 2538 }, { "epoch": 0.08, "learning_rate": 4.9717227982461055e-06, "loss": 1.1239, "step": 2539 }, { "epoch": 0.08, "learning_rate": 4.971686203494842e-06, "loss": 1.2415, "step": 2540 }, { "epoch": 0.08, "learning_rate": 4.971649585214315e-06, "loss": 1.1077, "step": 2541 }, { "epoch": 0.08, "learning_rate": 4.971612943404876e-06, "loss": 1.2751, "step": 2542 }, { "epoch": 0.08, "learning_rate": 4.971576278066871e-06, "loss": 1.2079, "step": 2543 }, { "epoch": 0.08, "learning_rate": 4.97153958920065e-06, "loss": 1.0312, "step": 2544 }, { "epoch": 0.08, "learning_rate": 4.971502876806563e-06, "loss": 1.0806, "step": 2545 }, { "epoch": 0.08, "learning_rate": 4.971466140884958e-06, "loss": 1.1174, "step": 2546 }, { "epoch": 0.08, "learning_rate": 4.9714293814361865e-06, "loss": 1.2775, "step": 2547 }, { "epoch": 0.08, "learning_rate": 4.971392598460598e-06, "loss": 1.1641, "step": 2548 }, { "epoch": 0.08, "learning_rate": 4.971355791958542e-06, "loss": 1.2115, "step": 2549 }, { "epoch": 0.08, "learning_rate": 4.971318961930368e-06, "loss": 1.0908, "step": 2550 }, { "epoch": 0.08, "learning_rate": 4.971282108376429e-06, "loss": 1.1742, "step": 2551 }, { "epoch": 0.08, "learning_rate": 4.971245231297074e-06, "loss": 1.1703, "step": 2552 }, { "epoch": 0.08, "learning_rate": 4.971208330692655e-06, "loss": 1.1992, "step": 2553 }, { "epoch": 0.08, "learning_rate": 4.971171406563522e-06, "loss": 1.2034, "step": 2554 }, { "epoch": 0.08, "learning_rate": 4.971134458910028e-06, "loss": 1.2306, "step": 2555 }, { "epoch": 0.08, "learning_rate": 4.971097487732524e-06, "loss": 1.1556, "step": 2556 }, { "epoch": 0.08, "learning_rate": 4.9710604930313625e-06, "loss": 1.1992, "step": 2557 }, { "epoch": 0.08, "learning_rate": 4.971023474806894e-06, "loss": 1.1165, "step": 2558 }, { "epoch": 0.08, "learning_rate": 4.970986433059473e-06, "loss": 1.1194, "step": 2559 }, { "epoch": 0.08, "learning_rate": 4.970949367789451e-06, "loss": 1.0812, "step": 2560 }, { "epoch": 0.08, "learning_rate": 4.9709122789971805e-06, "loss": 1.1432, "step": 2561 }, { "epoch": 0.08, "learning_rate": 4.970875166683017e-06, "loss": 1.1439, "step": 2562 }, { "epoch": 0.08, "learning_rate": 4.97083803084731e-06, "loss": 1.0571, "step": 2563 }, { "epoch": 0.08, "learning_rate": 4.970800871490415e-06, "loss": 1.2118, "step": 2564 }, { "epoch": 0.08, "learning_rate": 4.970763688612687e-06, "loss": 1.1707, "step": 2565 }, { "epoch": 0.08, "learning_rate": 4.970726482214478e-06, "loss": 1.1771, "step": 2566 }, { "epoch": 0.08, "learning_rate": 4.970689252296142e-06, "loss": 1.3208, "step": 2567 }, { "epoch": 0.08, "learning_rate": 4.970651998858036e-06, "loss": 1.2413, "step": 2568 }, { "epoch": 0.08, "learning_rate": 4.970614721900512e-06, "loss": 1.0828, "step": 2569 }, { "epoch": 0.08, "learning_rate": 4.970577421423925e-06, "loss": 1.278, "step": 2570 }, { "epoch": 0.08, "learning_rate": 4.970540097428632e-06, "loss": 1.0607, "step": 2571 }, { "epoch": 0.08, "learning_rate": 4.970502749914986e-06, "loss": 1.1439, "step": 2572 }, { "epoch": 0.08, "learning_rate": 4.970465378883345e-06, "loss": 1.1781, "step": 2573 }, { "epoch": 0.08, "learning_rate": 4.970427984334062e-06, "loss": 1.1423, "step": 2574 }, { "epoch": 0.08, "learning_rate": 4.970390566267495e-06, "loss": 1.1765, "step": 2575 }, { "epoch": 0.08, "learning_rate": 4.970353124684e-06, "loss": 1.0581, "step": 2576 }, { "epoch": 0.08, "learning_rate": 4.9703156595839325e-06, "loss": 1.1124, "step": 2577 }, { "epoch": 0.08, "learning_rate": 4.9702781709676495e-06, "loss": 1.1677, "step": 2578 }, { "epoch": 0.08, "learning_rate": 4.970240658835508e-06, "loss": 1.1824, "step": 2579 }, { "epoch": 0.08, "learning_rate": 4.970203123187866e-06, "loss": 1.1627, "step": 2580 }, { "epoch": 0.08, "learning_rate": 4.970165564025079e-06, "loss": 1.1066, "step": 2581 }, { "epoch": 0.08, "learning_rate": 4.970127981347507e-06, "loss": 1.1246, "step": 2582 }, { "epoch": 0.08, "learning_rate": 4.970090375155505e-06, "loss": 1.1619, "step": 2583 }, { "epoch": 0.08, "learning_rate": 4.9700527454494315e-06, "loss": 1.0868, "step": 2584 }, { "epoch": 0.08, "learning_rate": 4.970015092229647e-06, "loss": 1.1823, "step": 2585 }, { "epoch": 0.08, "learning_rate": 4.969977415496508e-06, "loss": 1.1882, "step": 2586 }, { "epoch": 0.08, "learning_rate": 4.9699397152503734e-06, "loss": 1.1821, "step": 2587 }, { "epoch": 0.08, "learning_rate": 4.9699019914916024e-06, "loss": 1.1948, "step": 2588 }, { "epoch": 0.08, "learning_rate": 4.969864244220554e-06, "loss": 1.147, "step": 2589 }, { "epoch": 0.08, "learning_rate": 4.9698264734375874e-06, "loss": 1.139, "step": 2590 }, { "epoch": 0.08, "learning_rate": 4.9697886791430625e-06, "loss": 1.2021, "step": 2591 }, { "epoch": 0.08, "learning_rate": 4.969750861337338e-06, "loss": 1.224, "step": 2592 }, { "epoch": 0.08, "learning_rate": 4.9697130200207754e-06, "loss": 1.1225, "step": 2593 }, { "epoch": 0.08, "learning_rate": 4.969675155193735e-06, "loss": 1.1502, "step": 2594 }, { "epoch": 0.08, "learning_rate": 4.969637266856576e-06, "loss": 1.1721, "step": 2595 }, { "epoch": 0.08, "learning_rate": 4.96959935500966e-06, "loss": 1.1217, "step": 2596 }, { "epoch": 0.08, "learning_rate": 4.969561419653347e-06, "loss": 1.0771, "step": 2597 }, { "epoch": 0.08, "learning_rate": 4.9695234607879986e-06, "loss": 1.1263, "step": 2598 }, { "epoch": 0.08, "learning_rate": 4.969485478413976e-06, "loss": 1.2081, "step": 2599 }, { "epoch": 0.08, "learning_rate": 4.969447472531641e-06, "loss": 1.0327, "step": 2600 }, { "epoch": 0.08, "learning_rate": 4.969409443141356e-06, "loss": 1.2365, "step": 2601 }, { "epoch": 0.08, "learning_rate": 4.969371390243483e-06, "loss": 1.0519, "step": 2602 }, { "epoch": 0.08, "learning_rate": 4.969333313838382e-06, "loss": 1.2091, "step": 2603 }, { "epoch": 0.08, "learning_rate": 4.969295213926418e-06, "loss": 1.1888, "step": 2604 }, { "epoch": 0.08, "learning_rate": 4.969257090507953e-06, "loss": 1.1405, "step": 2605 }, { "epoch": 0.08, "learning_rate": 4.9692189435833495e-06, "loss": 1.1331, "step": 2606 }, { "epoch": 0.08, "learning_rate": 4.969180773152971e-06, "loss": 1.0916, "step": 2607 }, { "epoch": 0.08, "learning_rate": 4.96914257921718e-06, "loss": 1.2206, "step": 2608 }, { "epoch": 0.08, "learning_rate": 4.969104361776342e-06, "loss": 1.113, "step": 2609 }, { "epoch": 0.08, "learning_rate": 4.9690661208308185e-06, "loss": 1.0297, "step": 2610 }, { "epoch": 0.08, "learning_rate": 4.9690278563809755e-06, "loss": 1.1425, "step": 2611 }, { "epoch": 0.08, "learning_rate": 4.968989568427176e-06, "loss": 1.1799, "step": 2612 }, { "epoch": 0.08, "learning_rate": 4.968951256969785e-06, "loss": 1.151, "step": 2613 }, { "epoch": 0.08, "learning_rate": 4.9689129220091675e-06, "loss": 1.1987, "step": 2614 }, { "epoch": 0.08, "learning_rate": 4.968874563545688e-06, "loss": 1.1485, "step": 2615 }, { "epoch": 0.08, "learning_rate": 4.9688361815797115e-06, "loss": 1.222, "step": 2616 }, { "epoch": 0.08, "learning_rate": 4.9687977761116035e-06, "loss": 1.1161, "step": 2617 }, { "epoch": 0.08, "learning_rate": 4.9687593471417296e-06, "loss": 1.1352, "step": 2618 }, { "epoch": 0.08, "learning_rate": 4.9687208946704555e-06, "loss": 1.2532, "step": 2619 }, { "epoch": 0.08, "learning_rate": 4.968682418698148e-06, "loss": 1.236, "step": 2620 }, { "epoch": 0.08, "learning_rate": 4.968643919225173e-06, "loss": 1.0186, "step": 2621 }, { "epoch": 0.08, "learning_rate": 4.968605396251896e-06, "loss": 1.0884, "step": 2622 }, { "epoch": 0.08, "learning_rate": 4.9685668497786855e-06, "loss": 1.2299, "step": 2623 }, { "epoch": 0.08, "learning_rate": 4.968528279805907e-06, "loss": 1.1835, "step": 2624 }, { "epoch": 0.08, "learning_rate": 4.968489686333928e-06, "loss": 1.103, "step": 2625 }, { "epoch": 0.08, "learning_rate": 4.9684510693631165e-06, "loss": 1.0466, "step": 2626 }, { "epoch": 0.08, "learning_rate": 4.9684124288938395e-06, "loss": 1.2383, "step": 2627 }, { "epoch": 0.08, "learning_rate": 4.968373764926465e-06, "loss": 1.0576, "step": 2628 }, { "epoch": 0.08, "learning_rate": 4.968335077461361e-06, "loss": 1.0831, "step": 2629 }, { "epoch": 0.08, "learning_rate": 4.968296366498896e-06, "loss": 1.1729, "step": 2630 }, { "epoch": 0.08, "learning_rate": 4.968257632039438e-06, "loss": 1.1721, "step": 2631 }, { "epoch": 0.08, "learning_rate": 4.968218874083356e-06, "loss": 1.0349, "step": 2632 }, { "epoch": 0.08, "learning_rate": 4.9681800926310196e-06, "loss": 1.1046, "step": 2633 }, { "epoch": 0.08, "learning_rate": 4.968141287682797e-06, "loss": 1.1819, "step": 2634 }, { "epoch": 0.08, "learning_rate": 4.968102459239058e-06, "loss": 1.0283, "step": 2635 }, { "epoch": 0.08, "learning_rate": 4.968063607300173e-06, "loss": 1.2427, "step": 2636 }, { "epoch": 0.08, "learning_rate": 4.96802473186651e-06, "loss": 1.1804, "step": 2637 }, { "epoch": 0.08, "learning_rate": 4.967985832938441e-06, "loss": 1.2158, "step": 2638 }, { "epoch": 0.08, "learning_rate": 4.967946910516336e-06, "loss": 1.2183, "step": 2639 }, { "epoch": 0.08, "learning_rate": 4.967907964600563e-06, "loss": 1.1858, "step": 2640 }, { "epoch": 0.08, "learning_rate": 4.967868995191497e-06, "loss": 1.1481, "step": 2641 }, { "epoch": 0.08, "learning_rate": 4.967830002289505e-06, "loss": 1.0664, "step": 2642 }, { "epoch": 0.08, "learning_rate": 4.967790985894961e-06, "loss": 1.2611, "step": 2643 }, { "epoch": 0.08, "learning_rate": 4.967751946008235e-06, "loss": 1.1627, "step": 2644 }, { "epoch": 0.08, "learning_rate": 4.967712882629699e-06, "loss": 1.1399, "step": 2645 }, { "epoch": 0.08, "learning_rate": 4.967673795759726e-06, "loss": 1.2074, "step": 2646 }, { "epoch": 0.08, "learning_rate": 4.967634685398685e-06, "loss": 1.2109, "step": 2647 }, { "epoch": 0.08, "learning_rate": 4.967595551546951e-06, "loss": 1.2366, "step": 2648 }, { "epoch": 0.08, "learning_rate": 4.967556394204896e-06, "loss": 1.1979, "step": 2649 }, { "epoch": 0.08, "learning_rate": 4.967517213372892e-06, "loss": 1.1648, "step": 2650 }, { "epoch": 0.08, "learning_rate": 4.967478009051313e-06, "loss": 1.1372, "step": 2651 }, { "epoch": 0.08, "learning_rate": 4.967438781240532e-06, "loss": 1.1874, "step": 2652 }, { "epoch": 0.08, "learning_rate": 4.967399529940922e-06, "loss": 1.0513, "step": 2653 }, { "epoch": 0.08, "learning_rate": 4.967360255152857e-06, "loss": 1.0471, "step": 2654 }, { "epoch": 0.08, "learning_rate": 4.96732095687671e-06, "loss": 1.2137, "step": 2655 }, { "epoch": 0.08, "learning_rate": 4.967281635112856e-06, "loss": 1.2463, "step": 2656 }, { "epoch": 0.08, "learning_rate": 4.967242289861669e-06, "loss": 1.2393, "step": 2657 }, { "epoch": 0.08, "learning_rate": 4.967202921123524e-06, "loss": 1.1414, "step": 2658 }, { "epoch": 0.08, "learning_rate": 4.9671635288987955e-06, "loss": 1.1206, "step": 2659 }, { "epoch": 0.08, "learning_rate": 4.9671241131878575e-06, "loss": 1.178, "step": 2660 }, { "epoch": 0.08, "learning_rate": 4.967084673991088e-06, "loss": 1.1614, "step": 2661 }, { "epoch": 0.08, "learning_rate": 4.967045211308859e-06, "loss": 1.2672, "step": 2662 }, { "epoch": 0.08, "learning_rate": 4.967005725141548e-06, "loss": 1.1768, "step": 2663 }, { "epoch": 0.08, "learning_rate": 4.966966215489532e-06, "loss": 1.1965, "step": 2664 }, { "epoch": 0.08, "learning_rate": 4.966926682353184e-06, "loss": 1.065, "step": 2665 }, { "epoch": 0.08, "learning_rate": 4.966887125732883e-06, "loss": 1.2606, "step": 2666 }, { "epoch": 0.08, "learning_rate": 4.9668475456290046e-06, "loss": 1.2399, "step": 2667 }, { "epoch": 0.08, "learning_rate": 4.966807942041925e-06, "loss": 1.0883, "step": 2668 }, { "epoch": 0.08, "learning_rate": 4.9667683149720225e-06, "loss": 1.2025, "step": 2669 }, { "epoch": 0.08, "learning_rate": 4.9667286644196735e-06, "loss": 1.1801, "step": 2670 }, { "epoch": 0.08, "learning_rate": 4.9666889903852555e-06, "loss": 1.2102, "step": 2671 }, { "epoch": 0.08, "learning_rate": 4.966649292869147e-06, "loss": 1.1164, "step": 2672 }, { "epoch": 0.08, "learning_rate": 4.966609571871724e-06, "loss": 1.1183, "step": 2673 }, { "epoch": 0.08, "learning_rate": 4.966569827393367e-06, "loss": 1.1655, "step": 2674 }, { "epoch": 0.08, "learning_rate": 4.966530059434452e-06, "loss": 1.0982, "step": 2675 }, { "epoch": 0.08, "learning_rate": 4.96649026799536e-06, "loss": 1.0613, "step": 2676 }, { "epoch": 0.08, "learning_rate": 4.966450453076468e-06, "loss": 1.2664, "step": 2677 }, { "epoch": 0.08, "learning_rate": 4.966410614678155e-06, "loss": 1.0391, "step": 2678 }, { "epoch": 0.08, "learning_rate": 4.966370752800802e-06, "loss": 1.1491, "step": 2679 }, { "epoch": 0.08, "learning_rate": 4.966330867444786e-06, "loss": 1.1532, "step": 2680 }, { "epoch": 0.08, "learning_rate": 4.966290958610489e-06, "loss": 1.1063, "step": 2681 }, { "epoch": 0.08, "learning_rate": 4.96625102629829e-06, "loss": 1.1137, "step": 2682 }, { "epoch": 0.08, "learning_rate": 4.9662110705085684e-06, "loss": 1.1227, "step": 2683 }, { "epoch": 0.08, "learning_rate": 4.966171091241705e-06, "loss": 1.1021, "step": 2684 }, { "epoch": 0.08, "learning_rate": 4.966131088498081e-06, "loss": 1.2235, "step": 2685 }, { "epoch": 0.08, "learning_rate": 4.9660910622780764e-06, "loss": 1.1677, "step": 2686 }, { "epoch": 0.08, "learning_rate": 4.966051012582073e-06, "loss": 1.1419, "step": 2687 }, { "epoch": 0.08, "learning_rate": 4.966010939410451e-06, "loss": 1.1201, "step": 2688 }, { "epoch": 0.08, "learning_rate": 4.965970842763594e-06, "loss": 1.1387, "step": 2689 }, { "epoch": 0.08, "learning_rate": 4.96593072264188e-06, "loss": 1.1815, "step": 2690 }, { "epoch": 0.08, "learning_rate": 4.965890579045695e-06, "loss": 1.1275, "step": 2691 }, { "epoch": 0.08, "learning_rate": 4.9658504119754185e-06, "loss": 1.157, "step": 2692 }, { "epoch": 0.08, "learning_rate": 4.965810221431434e-06, "loss": 1.1127, "step": 2693 }, { "epoch": 0.08, "learning_rate": 4.965770007414124e-06, "loss": 1.1695, "step": 2694 }, { "epoch": 0.08, "learning_rate": 4.96572976992387e-06, "loss": 1.0901, "step": 2695 }, { "epoch": 0.08, "learning_rate": 4.9656895089610565e-06, "loss": 1.1124, "step": 2696 }, { "epoch": 0.08, "learning_rate": 4.965649224526067e-06, "loss": 1.2206, "step": 2697 }, { "epoch": 0.08, "learning_rate": 4.9656089166192845e-06, "loss": 1.2491, "step": 2698 }, { "epoch": 0.08, "learning_rate": 4.965568585241092e-06, "loss": 1.1542, "step": 2699 }, { "epoch": 0.08, "learning_rate": 4.965528230391874e-06, "loss": 1.116, "step": 2700 }, { "epoch": 0.08, "learning_rate": 4.965487852072015e-06, "loss": 1.0494, "step": 2701 }, { "epoch": 0.08, "learning_rate": 4.965447450281899e-06, "loss": 1.0958, "step": 2702 }, { "epoch": 0.08, "learning_rate": 4.965407025021911e-06, "loss": 1.1385, "step": 2703 }, { "epoch": 0.08, "learning_rate": 4.965366576292435e-06, "loss": 1.2639, "step": 2704 }, { "epoch": 0.08, "learning_rate": 4.965326104093857e-06, "loss": 1.1647, "step": 2705 }, { "epoch": 0.08, "learning_rate": 4.965285608426561e-06, "loss": 1.0934, "step": 2706 }, { "epoch": 0.08, "learning_rate": 4.9652450892909345e-06, "loss": 1.1693, "step": 2707 }, { "epoch": 0.08, "learning_rate": 4.965204546687361e-06, "loss": 1.1772, "step": 2708 }, { "epoch": 0.08, "learning_rate": 4.965163980616228e-06, "loss": 1.1815, "step": 2709 }, { "epoch": 0.08, "learning_rate": 4.965123391077921e-06, "loss": 1.1492, "step": 2710 }, { "epoch": 0.08, "learning_rate": 4.965082778072826e-06, "loss": 1.0486, "step": 2711 }, { "epoch": 0.08, "learning_rate": 4.965042141601332e-06, "loss": 1.1584, "step": 2712 }, { "epoch": 0.08, "learning_rate": 4.965001481663823e-06, "loss": 1.1807, "step": 2713 }, { "epoch": 0.08, "learning_rate": 4.9649607982606865e-06, "loss": 1.1685, "step": 2714 }, { "epoch": 0.08, "learning_rate": 4.96492009139231e-06, "loss": 1.0996, "step": 2715 }, { "epoch": 0.08, "learning_rate": 4.964879361059083e-06, "loss": 1.1992, "step": 2716 }, { "epoch": 0.08, "learning_rate": 4.96483860726139e-06, "loss": 1.0641, "step": 2717 }, { "epoch": 0.08, "learning_rate": 4.964797829999622e-06, "loss": 1.3025, "step": 2718 }, { "epoch": 0.08, "learning_rate": 4.964757029274164e-06, "loss": 1.0355, "step": 2719 }, { "epoch": 0.08, "learning_rate": 4.964716205085408e-06, "loss": 1.1327, "step": 2720 }, { "epoch": 0.08, "learning_rate": 4.9646753574337405e-06, "loss": 1.1056, "step": 2721 }, { "epoch": 0.08, "learning_rate": 4.96463448631955e-06, "loss": 1.1147, "step": 2722 }, { "epoch": 0.08, "learning_rate": 4.9645935917432265e-06, "loss": 1.2156, "step": 2723 }, { "epoch": 0.08, "learning_rate": 4.964552673705159e-06, "loss": 1.1366, "step": 2724 }, { "epoch": 0.08, "learning_rate": 4.964511732205736e-06, "loss": 1.1793, "step": 2725 }, { "epoch": 0.08, "learning_rate": 4.96447076724535e-06, "loss": 1.171, "step": 2726 }, { "epoch": 0.08, "learning_rate": 4.964429778824388e-06, "loss": 1.1721, "step": 2727 }, { "epoch": 0.08, "learning_rate": 4.964388766943241e-06, "loss": 1.0599, "step": 2728 }, { "epoch": 0.08, "learning_rate": 4.964347731602301e-06, "loss": 1.1729, "step": 2729 }, { "epoch": 0.08, "learning_rate": 4.964306672801957e-06, "loss": 1.1495, "step": 2730 }, { "epoch": 0.08, "learning_rate": 4.964265590542601e-06, "loss": 1.2222, "step": 2731 }, { "epoch": 0.08, "learning_rate": 4.964224484824622e-06, "loss": 1.1937, "step": 2732 }, { "epoch": 0.08, "learning_rate": 4.964183355648414e-06, "loss": 1.1004, "step": 2733 }, { "epoch": 0.08, "learning_rate": 4.964142203014366e-06, "loss": 1.126, "step": 2734 }, { "epoch": 0.08, "learning_rate": 4.964101026922872e-06, "loss": 1.1624, "step": 2735 }, { "epoch": 0.08, "learning_rate": 4.964059827374323e-06, "loss": 1.1232, "step": 2736 }, { "epoch": 0.08, "learning_rate": 4.964018604369111e-06, "loss": 1.1885, "step": 2737 }, { "epoch": 0.08, "learning_rate": 4.963977357907628e-06, "loss": 1.097, "step": 2738 }, { "epoch": 0.08, "learning_rate": 4.963936087990267e-06, "loss": 1.1998, "step": 2739 }, { "epoch": 0.08, "learning_rate": 4.963894794617422e-06, "loss": 1.1417, "step": 2740 }, { "epoch": 0.08, "learning_rate": 4.963853477789486e-06, "loss": 1.097, "step": 2741 }, { "epoch": 0.08, "learning_rate": 4.96381213750685e-06, "loss": 1.2522, "step": 2742 }, { "epoch": 0.08, "learning_rate": 4.96377077376991e-06, "loss": 1.2993, "step": 2743 }, { "epoch": 0.08, "learning_rate": 4.963729386579058e-06, "loss": 1.0817, "step": 2744 }, { "epoch": 0.08, "learning_rate": 4.96368797593469e-06, "loss": 1.0551, "step": 2745 }, { "epoch": 0.08, "learning_rate": 4.9636465418371984e-06, "loss": 1.1349, "step": 2746 }, { "epoch": 0.08, "learning_rate": 4.963605084286978e-06, "loss": 1.0811, "step": 2747 }, { "epoch": 0.08, "learning_rate": 4.963563603284424e-06, "loss": 1.1995, "step": 2748 }, { "epoch": 0.08, "learning_rate": 4.963522098829931e-06, "loss": 1.1502, "step": 2749 }, { "epoch": 0.08, "learning_rate": 4.963480570923893e-06, "loss": 1.243, "step": 2750 }, { "epoch": 0.08, "learning_rate": 4.963439019566708e-06, "loss": 1.1171, "step": 2751 }, { "epoch": 0.08, "learning_rate": 4.963397444758769e-06, "loss": 1.0053, "step": 2752 }, { "epoch": 0.08, "learning_rate": 4.9633558465004736e-06, "loss": 1.176, "step": 2753 }, { "epoch": 0.08, "learning_rate": 4.963314224792216e-06, "loss": 1.1128, "step": 2754 }, { "epoch": 0.08, "learning_rate": 4.963272579634394e-06, "loss": 1.1052, "step": 2755 }, { "epoch": 0.08, "learning_rate": 4.9632309110274026e-06, "loss": 1.2751, "step": 2756 }, { "epoch": 0.08, "learning_rate": 4.96318921897164e-06, "loss": 1.1329, "step": 2757 }, { "epoch": 0.08, "learning_rate": 4.963147503467503e-06, "loss": 1.2058, "step": 2758 }, { "epoch": 0.08, "learning_rate": 4.963105764515387e-06, "loss": 1.1125, "step": 2759 }, { "epoch": 0.08, "learning_rate": 4.96306400211569e-06, "loss": 1.2148, "step": 2760 }, { "epoch": 0.08, "learning_rate": 4.963022216268811e-06, "loss": 1.1965, "step": 2761 }, { "epoch": 0.08, "learning_rate": 4.962980406975147e-06, "loss": 1.1906, "step": 2762 }, { "epoch": 0.08, "learning_rate": 4.962938574235095e-06, "loss": 1.1367, "step": 2763 }, { "epoch": 0.08, "learning_rate": 4.962896718049053e-06, "loss": 1.1877, "step": 2764 }, { "epoch": 0.08, "learning_rate": 4.9628548384174215e-06, "loss": 1.144, "step": 2765 }, { "epoch": 0.08, "learning_rate": 4.962812935340598e-06, "loss": 1.1688, "step": 2766 }, { "epoch": 0.08, "learning_rate": 4.962771008818982e-06, "loss": 1.1544, "step": 2767 }, { "epoch": 0.08, "learning_rate": 4.962729058852971e-06, "loss": 1.214, "step": 2768 }, { "epoch": 0.08, "learning_rate": 4.9626870854429665e-06, "loss": 1.3304, "step": 2769 }, { "epoch": 0.08, "learning_rate": 4.962645088589366e-06, "loss": 1.1343, "step": 2770 }, { "epoch": 0.08, "learning_rate": 4.9626030682925705e-06, "loss": 1.2582, "step": 2771 }, { "epoch": 0.08, "learning_rate": 4.962561024552981e-06, "loss": 1.0654, "step": 2772 }, { "epoch": 0.08, "learning_rate": 4.962518957370995e-06, "loss": 1.2671, "step": 2773 }, { "epoch": 0.08, "learning_rate": 4.962476866747015e-06, "loss": 1.2588, "step": 2774 }, { "epoch": 0.08, "learning_rate": 4.962434752681442e-06, "loss": 1.2294, "step": 2775 }, { "epoch": 0.08, "learning_rate": 4.962392615174676e-06, "loss": 1.1812, "step": 2776 }, { "epoch": 0.08, "learning_rate": 4.962350454227118e-06, "loss": 1.2864, "step": 2777 }, { "epoch": 0.08, "learning_rate": 4.962308269839169e-06, "loss": 1.1523, "step": 2778 }, { "epoch": 0.08, "learning_rate": 4.9622660620112315e-06, "loss": 1.0493, "step": 2779 }, { "epoch": 0.08, "learning_rate": 4.962223830743707e-06, "loss": 1.1545, "step": 2780 }, { "epoch": 0.08, "learning_rate": 4.962181576036997e-06, "loss": 1.1458, "step": 2781 }, { "epoch": 0.08, "learning_rate": 4.962139297891505e-06, "loss": 1.1403, "step": 2782 }, { "epoch": 0.08, "learning_rate": 4.962096996307633e-06, "loss": 1.1707, "step": 2783 }, { "epoch": 0.08, "learning_rate": 4.962054671285782e-06, "loss": 1.0922, "step": 2784 }, { "epoch": 0.08, "learning_rate": 4.962012322826357e-06, "loss": 1.1339, "step": 2785 }, { "epoch": 0.08, "learning_rate": 4.961969950929761e-06, "loss": 1.0613, "step": 2786 }, { "epoch": 0.08, "learning_rate": 4.961927555596397e-06, "loss": 1.1302, "step": 2787 }, { "epoch": 0.08, "learning_rate": 4.961885136826667e-06, "loss": 1.2122, "step": 2788 }, { "epoch": 0.08, "learning_rate": 4.9618426946209765e-06, "loss": 1.1237, "step": 2789 }, { "epoch": 0.08, "learning_rate": 4.961800228979729e-06, "loss": 1.1555, "step": 2790 }, { "epoch": 0.08, "learning_rate": 4.96175773990333e-06, "loss": 1.1367, "step": 2791 }, { "epoch": 0.08, "learning_rate": 4.961715227392183e-06, "loss": 1.1972, "step": 2792 }, { "epoch": 0.08, "learning_rate": 4.961672691446692e-06, "loss": 1.1879, "step": 2793 }, { "epoch": 0.08, "learning_rate": 4.9616301320672626e-06, "loss": 1.2675, "step": 2794 }, { "epoch": 0.08, "learning_rate": 4.9615875492543e-06, "loss": 1.1414, "step": 2795 }, { "epoch": 0.08, "learning_rate": 4.961544943008209e-06, "loss": 1.1978, "step": 2796 }, { "epoch": 0.08, "learning_rate": 4.961502313329397e-06, "loss": 1.2128, "step": 2797 }, { "epoch": 0.08, "learning_rate": 4.961459660218267e-06, "loss": 1.2065, "step": 2798 }, { "epoch": 0.08, "learning_rate": 4.9614169836752275e-06, "loss": 1.1356, "step": 2799 }, { "epoch": 0.08, "learning_rate": 4.961374283700683e-06, "loss": 1.2502, "step": 2800 }, { "epoch": 0.08, "learning_rate": 4.9613315602950414e-06, "loss": 1.161, "step": 2801 }, { "epoch": 0.08, "learning_rate": 4.961288813458708e-06, "loss": 1.176, "step": 2802 }, { "epoch": 0.08, "learning_rate": 4.961246043192091e-06, "loss": 1.0763, "step": 2803 }, { "epoch": 0.08, "learning_rate": 4.9612032494955976e-06, "loss": 1.2213, "step": 2804 }, { "epoch": 0.08, "learning_rate": 4.961160432369634e-06, "loss": 1.2661, "step": 2805 }, { "epoch": 0.08, "learning_rate": 4.961117591814608e-06, "loss": 1.1155, "step": 2806 }, { "epoch": 0.08, "learning_rate": 4.961074727830929e-06, "loss": 1.2029, "step": 2807 }, { "epoch": 0.08, "learning_rate": 4.9610318404190025e-06, "loss": 1.1664, "step": 2808 }, { "epoch": 0.08, "learning_rate": 4.960988929579239e-06, "loss": 1.1469, "step": 2809 }, { "epoch": 0.08, "learning_rate": 4.960945995312046e-06, "loss": 1.1771, "step": 2810 }, { "epoch": 0.08, "learning_rate": 4.960903037617833e-06, "loss": 1.1181, "step": 2811 }, { "epoch": 0.08, "learning_rate": 4.960860056497007e-06, "loss": 1.1193, "step": 2812 }, { "epoch": 0.08, "learning_rate": 4.960817051949979e-06, "loss": 1.114, "step": 2813 }, { "epoch": 0.08, "learning_rate": 4.960774023977159e-06, "loss": 1.1881, "step": 2814 }, { "epoch": 0.08, "learning_rate": 4.960730972578954e-06, "loss": 1.1499, "step": 2815 }, { "epoch": 0.08, "learning_rate": 4.9606878977557756e-06, "loss": 1.172, "step": 2816 }, { "epoch": 0.08, "learning_rate": 4.960644799508033e-06, "loss": 1.1717, "step": 2817 }, { "epoch": 0.08, "learning_rate": 4.960601677836138e-06, "loss": 1.0978, "step": 2818 }, { "epoch": 0.08, "learning_rate": 4.960558532740499e-06, "loss": 1.2255, "step": 2819 }, { "epoch": 0.08, "learning_rate": 4.960515364221528e-06, "loss": 1.1669, "step": 2820 }, { "epoch": 0.08, "learning_rate": 4.960472172279637e-06, "loss": 1.1379, "step": 2821 }, { "epoch": 0.09, "learning_rate": 4.960428956915236e-06, "loss": 1.0958, "step": 2822 }, { "epoch": 0.09, "learning_rate": 4.9603857181287355e-06, "loss": 1.1822, "step": 2823 }, { "epoch": 0.09, "learning_rate": 4.960342455920547e-06, "loss": 1.152, "step": 2824 }, { "epoch": 0.09, "learning_rate": 4.9602991702910845e-06, "loss": 1.2315, "step": 2825 }, { "epoch": 0.09, "learning_rate": 4.960255861240758e-06, "loss": 1.2033, "step": 2826 }, { "epoch": 0.09, "learning_rate": 4.960212528769982e-06, "loss": 1.1248, "step": 2827 }, { "epoch": 0.09, "learning_rate": 4.960169172879166e-06, "loss": 1.132, "step": 2828 }, { "epoch": 0.09, "learning_rate": 4.960125793568725e-06, "loss": 1.199, "step": 2829 }, { "epoch": 0.09, "learning_rate": 4.960082390839072e-06, "loss": 1.0803, "step": 2830 }, { "epoch": 0.09, "learning_rate": 4.960038964690618e-06, "loss": 1.2107, "step": 2831 }, { "epoch": 0.09, "learning_rate": 4.9599955151237785e-06, "loss": 1.25, "step": 2832 }, { "epoch": 0.09, "learning_rate": 4.959952042138967e-06, "loss": 1.2112, "step": 2833 }, { "epoch": 0.09, "learning_rate": 4.959908545736596e-06, "loss": 1.2318, "step": 2834 }, { "epoch": 0.09, "learning_rate": 4.959865025917081e-06, "loss": 1.0996, "step": 2835 }, { "epoch": 0.09, "learning_rate": 4.959821482680836e-06, "loss": 1.2566, "step": 2836 }, { "epoch": 0.09, "learning_rate": 4.959777916028274e-06, "loss": 1.1031, "step": 2837 }, { "epoch": 0.09, "learning_rate": 4.959734325959812e-06, "loss": 1.1603, "step": 2838 }, { "epoch": 0.09, "learning_rate": 4.9596907124758634e-06, "loss": 1.1903, "step": 2839 }, { "epoch": 0.09, "learning_rate": 4.9596470755768435e-06, "loss": 1.1596, "step": 2840 }, { "epoch": 0.09, "learning_rate": 4.959603415263168e-06, "loss": 1.1747, "step": 2841 }, { "epoch": 0.09, "learning_rate": 4.9595597315352525e-06, "loss": 1.2148, "step": 2842 }, { "epoch": 0.09, "learning_rate": 4.959516024393514e-06, "loss": 1.0595, "step": 2843 }, { "epoch": 0.09, "learning_rate": 4.959472293838367e-06, "loss": 1.1208, "step": 2844 }, { "epoch": 0.09, "learning_rate": 4.959428539870228e-06, "loss": 1.1919, "step": 2845 }, { "epoch": 0.09, "learning_rate": 4.959384762489514e-06, "loss": 1.118, "step": 2846 }, { "epoch": 0.09, "learning_rate": 4.959340961696641e-06, "loss": 1.0518, "step": 2847 }, { "epoch": 0.09, "learning_rate": 4.959297137492027e-06, "loss": 1.1677, "step": 2848 }, { "epoch": 0.09, "learning_rate": 4.959253289876089e-06, "loss": 1.2476, "step": 2849 }, { "epoch": 0.09, "learning_rate": 4.959209418849244e-06, "loss": 1.1789, "step": 2850 }, { "epoch": 0.09, "learning_rate": 4.959165524411909e-06, "loss": 1.1125, "step": 2851 }, { "epoch": 0.09, "learning_rate": 4.959121606564503e-06, "loss": 1.1019, "step": 2852 }, { "epoch": 0.09, "learning_rate": 4.9590776653074444e-06, "loss": 1.1956, "step": 2853 }, { "epoch": 0.09, "learning_rate": 4.95903370064115e-06, "loss": 1.1256, "step": 2854 }, { "epoch": 0.09, "learning_rate": 4.958989712566039e-06, "loss": 1.095, "step": 2855 }, { "epoch": 0.09, "learning_rate": 4.95894570108253e-06, "loss": 1.201, "step": 2856 }, { "epoch": 0.09, "learning_rate": 4.958901666191042e-06, "loss": 1.1095, "step": 2857 }, { "epoch": 0.09, "learning_rate": 4.958857607891996e-06, "loss": 1.2328, "step": 2858 }, { "epoch": 0.09, "learning_rate": 4.9588135261858085e-06, "loss": 1.1558, "step": 2859 }, { "epoch": 0.09, "learning_rate": 4.9587694210729005e-06, "loss": 1.2471, "step": 2860 }, { "epoch": 0.09, "learning_rate": 4.958725292553693e-06, "loss": 1.2534, "step": 2861 }, { "epoch": 0.09, "learning_rate": 4.958681140628604e-06, "loss": 1.2735, "step": 2862 }, { "epoch": 0.09, "learning_rate": 4.9586369652980535e-06, "loss": 1.1358, "step": 2863 }, { "epoch": 0.09, "learning_rate": 4.958592766562464e-06, "loss": 1.1526, "step": 2864 }, { "epoch": 0.09, "learning_rate": 4.958548544422257e-06, "loss": 1.126, "step": 2865 }, { "epoch": 0.09, "learning_rate": 4.958504298877851e-06, "loss": 1.2223, "step": 2866 }, { "epoch": 0.09, "learning_rate": 4.958460029929667e-06, "loss": 1.0379, "step": 2867 }, { "epoch": 0.09, "learning_rate": 4.958415737578128e-06, "loss": 1.1637, "step": 2868 }, { "epoch": 0.09, "learning_rate": 4.958371421823656e-06, "loss": 1.2047, "step": 2869 }, { "epoch": 0.09, "learning_rate": 4.958327082666672e-06, "loss": 1.1865, "step": 2870 }, { "epoch": 0.09, "learning_rate": 4.958282720107598e-06, "loss": 1.1909, "step": 2871 }, { "epoch": 0.09, "learning_rate": 4.958238334146856e-06, "loss": 1.0002, "step": 2872 }, { "epoch": 0.09, "learning_rate": 4.958193924784869e-06, "loss": 1.1626, "step": 2873 }, { "epoch": 0.09, "learning_rate": 4.95814949202206e-06, "loss": 1.1014, "step": 2874 }, { "epoch": 0.09, "learning_rate": 4.958105035858851e-06, "loss": 1.1494, "step": 2875 }, { "epoch": 0.09, "learning_rate": 4.9580605562956675e-06, "loss": 1.2157, "step": 2876 }, { "epoch": 0.09, "learning_rate": 4.95801605333293e-06, "loss": 1.129, "step": 2877 }, { "epoch": 0.09, "learning_rate": 4.957971526971064e-06, "loss": 1.0671, "step": 2878 }, { "epoch": 0.09, "learning_rate": 4.957926977210492e-06, "loss": 1.1183, "step": 2879 }, { "epoch": 0.09, "learning_rate": 4.957882404051641e-06, "loss": 1.252, "step": 2880 }, { "epoch": 0.09, "learning_rate": 4.957837807494932e-06, "loss": 1.1669, "step": 2881 }, { "epoch": 0.09, "learning_rate": 4.95779318754079e-06, "loss": 1.1483, "step": 2882 }, { "epoch": 0.09, "learning_rate": 4.957748544189642e-06, "loss": 1.1284, "step": 2883 }, { "epoch": 0.09, "learning_rate": 4.957703877441911e-06, "loss": 1.2583, "step": 2884 }, { "epoch": 0.09, "learning_rate": 4.957659187298022e-06, "loss": 1.1362, "step": 2885 }, { "epoch": 0.09, "learning_rate": 4.957614473758402e-06, "loss": 1.3756, "step": 2886 }, { "epoch": 0.09, "learning_rate": 4.957569736823476e-06, "loss": 1.2623, "step": 2887 }, { "epoch": 0.09, "learning_rate": 4.95752497649367e-06, "loss": 1.2458, "step": 2888 }, { "epoch": 0.09, "learning_rate": 4.957480192769408e-06, "loss": 1.2186, "step": 2889 }, { "epoch": 0.09, "learning_rate": 4.95743538565112e-06, "loss": 1.1446, "step": 2890 }, { "epoch": 0.09, "learning_rate": 4.95739055513923e-06, "loss": 1.1368, "step": 2891 }, { "epoch": 0.09, "learning_rate": 4.957345701234165e-06, "loss": 1.0597, "step": 2892 }, { "epoch": 0.09, "learning_rate": 4.9573008239363535e-06, "loss": 1.0554, "step": 2893 }, { "epoch": 0.09, "learning_rate": 4.957255923246221e-06, "loss": 1.1425, "step": 2894 }, { "epoch": 0.09, "learning_rate": 4.957210999164196e-06, "loss": 1.1835, "step": 2895 }, { "epoch": 0.09, "learning_rate": 4.957166051690705e-06, "loss": 1.1287, "step": 2896 }, { "epoch": 0.09, "learning_rate": 4.957121080826177e-06, "loss": 1.1, "step": 2897 }, { "epoch": 0.09, "learning_rate": 4.957076086571039e-06, "loss": 1.0518, "step": 2898 }, { "epoch": 0.09, "learning_rate": 4.957031068925721e-06, "loss": 1.1307, "step": 2899 }, { "epoch": 0.09, "learning_rate": 4.9569860278906504e-06, "loss": 1.2936, "step": 2900 }, { "epoch": 0.09, "learning_rate": 4.956940963466256e-06, "loss": 1.1915, "step": 2901 }, { "epoch": 0.09, "learning_rate": 4.956895875652967e-06, "loss": 1.1116, "step": 2902 }, { "epoch": 0.09, "learning_rate": 4.956850764451212e-06, "loss": 1.1787, "step": 2903 }, { "epoch": 0.09, "learning_rate": 4.956805629861421e-06, "loss": 1.124, "step": 2904 }, { "epoch": 0.09, "learning_rate": 4.9567604718840246e-06, "loss": 1.1401, "step": 2905 }, { "epoch": 0.09, "learning_rate": 4.956715290519452e-06, "loss": 1.1183, "step": 2906 }, { "epoch": 0.09, "learning_rate": 4.956670085768132e-06, "loss": 1.1266, "step": 2907 }, { "epoch": 0.09, "learning_rate": 4.956624857630496e-06, "loss": 1.0953, "step": 2908 }, { "epoch": 0.09, "learning_rate": 4.956579606106974e-06, "loss": 1.1782, "step": 2909 }, { "epoch": 0.09, "learning_rate": 4.956534331197998e-06, "loss": 1.1417, "step": 2910 }, { "epoch": 0.09, "learning_rate": 4.956489032903998e-06, "loss": 1.1989, "step": 2911 }, { "epoch": 0.09, "learning_rate": 4.956443711225406e-06, "loss": 1.2491, "step": 2912 }, { "epoch": 0.09, "learning_rate": 4.956398366162652e-06, "loss": 1.141, "step": 2913 }, { "epoch": 0.09, "learning_rate": 4.95635299771617e-06, "loss": 1.1619, "step": 2914 }, { "epoch": 0.09, "learning_rate": 4.95630760588639e-06, "loss": 1.21, "step": 2915 }, { "epoch": 0.09, "learning_rate": 4.956262190673744e-06, "loss": 1.0958, "step": 2916 }, { "epoch": 0.09, "learning_rate": 4.9562167520786655e-06, "loss": 1.2206, "step": 2917 }, { "epoch": 0.09, "learning_rate": 4.956171290101585e-06, "loss": 1.2473, "step": 2918 }, { "epoch": 0.09, "learning_rate": 4.956125804742939e-06, "loss": 1.0616, "step": 2919 }, { "epoch": 0.09, "learning_rate": 4.956080296003157e-06, "loss": 1.2001, "step": 2920 }, { "epoch": 0.09, "learning_rate": 4.956034763882674e-06, "loss": 1.1131, "step": 2921 }, { "epoch": 0.09, "learning_rate": 4.955989208381922e-06, "loss": 1.1091, "step": 2922 }, { "epoch": 0.09, "learning_rate": 4.955943629501336e-06, "loss": 1.1005, "step": 2923 }, { "epoch": 0.09, "learning_rate": 4.95589802724135e-06, "loss": 1.078, "step": 2924 }, { "epoch": 0.09, "learning_rate": 4.955852401602398e-06, "loss": 1.1754, "step": 2925 }, { "epoch": 0.09, "learning_rate": 4.955806752584913e-06, "loss": 1.2648, "step": 2926 }, { "epoch": 0.09, "learning_rate": 4.955761080189331e-06, "loss": 1.1819, "step": 2927 }, { "epoch": 0.09, "learning_rate": 4.955715384416085e-06, "loss": 1.1382, "step": 2928 }, { "epoch": 0.09, "learning_rate": 4.955669665265612e-06, "loss": 1.2815, "step": 2929 }, { "epoch": 0.09, "learning_rate": 4.955623922738347e-06, "loss": 1.1447, "step": 2930 }, { "epoch": 0.09, "learning_rate": 4.955578156834724e-06, "loss": 1.1628, "step": 2931 }, { "epoch": 0.09, "learning_rate": 4.9555323675551806e-06, "loss": 1.194, "step": 2932 }, { "epoch": 0.09, "learning_rate": 4.955486554900152e-06, "loss": 1.149, "step": 2933 }, { "epoch": 0.09, "learning_rate": 4.955440718870073e-06, "loss": 1.1058, "step": 2934 }, { "epoch": 0.09, "learning_rate": 4.95539485946538e-06, "loss": 1.1619, "step": 2935 }, { "epoch": 0.09, "learning_rate": 4.955348976686513e-06, "loss": 1.2661, "step": 2936 }, { "epoch": 0.09, "learning_rate": 4.9553030705339045e-06, "loss": 1.1799, "step": 2937 }, { "epoch": 0.09, "learning_rate": 4.955257141007993e-06, "loss": 1.1459, "step": 2938 }, { "epoch": 0.09, "learning_rate": 4.955211188109217e-06, "loss": 1.088, "step": 2939 }, { "epoch": 0.09, "learning_rate": 4.955165211838013e-06, "loss": 1.1271, "step": 2940 }, { "epoch": 0.09, "learning_rate": 4.955119212194818e-06, "loss": 1.1577, "step": 2941 }, { "epoch": 0.09, "learning_rate": 4.955073189180071e-06, "loss": 1.1111, "step": 2942 }, { "epoch": 0.09, "learning_rate": 4.955027142794209e-06, "loss": 1.249, "step": 2943 }, { "epoch": 0.09, "learning_rate": 4.954981073037672e-06, "loss": 1.0096, "step": 2944 }, { "epoch": 0.09, "learning_rate": 4.954934979910897e-06, "loss": 1.2083, "step": 2945 }, { "epoch": 0.09, "learning_rate": 4.954888863414323e-06, "loss": 1.1092, "step": 2946 }, { "epoch": 0.09, "learning_rate": 4.95484272354839e-06, "loss": 1.1303, "step": 2947 }, { "epoch": 0.09, "learning_rate": 4.954796560313536e-06, "loss": 1.1561, "step": 2948 }, { "epoch": 0.09, "learning_rate": 4.9547503737102005e-06, "loss": 1.2074, "step": 2949 }, { "epoch": 0.09, "learning_rate": 4.954704163738825e-06, "loss": 1.2646, "step": 2950 }, { "epoch": 0.09, "learning_rate": 4.954657930399848e-06, "loss": 1.2678, "step": 2951 }, { "epoch": 0.09, "learning_rate": 4.954611673693709e-06, "loss": 1.1319, "step": 2952 }, { "epoch": 0.09, "learning_rate": 4.954565393620849e-06, "loss": 1.0924, "step": 2953 }, { "epoch": 0.09, "learning_rate": 4.954519090181709e-06, "loss": 1.1284, "step": 2954 }, { "epoch": 0.09, "learning_rate": 4.95447276337673e-06, "loss": 1.1402, "step": 2955 }, { "epoch": 0.09, "learning_rate": 4.954426413206351e-06, "loss": 1.2806, "step": 2956 }, { "epoch": 0.09, "learning_rate": 4.954380039671016e-06, "loss": 1.0561, "step": 2957 }, { "epoch": 0.09, "learning_rate": 4.954333642771164e-06, "loss": 1.1332, "step": 2958 }, { "epoch": 0.09, "learning_rate": 4.954287222507238e-06, "loss": 1.1481, "step": 2959 }, { "epoch": 0.09, "learning_rate": 4.9542407788796796e-06, "loss": 1.2453, "step": 2960 }, { "epoch": 0.09, "learning_rate": 4.954194311888932e-06, "loss": 1.179, "step": 2961 }, { "epoch": 0.09, "learning_rate": 4.954147821535435e-06, "loss": 1.1689, "step": 2962 }, { "epoch": 0.09, "learning_rate": 4.954101307819634e-06, "loss": 1.1328, "step": 2963 }, { "epoch": 0.09, "learning_rate": 4.954054770741969e-06, "loss": 1.0934, "step": 2964 }, { "epoch": 0.09, "learning_rate": 4.9540082103028865e-06, "loss": 1.1627, "step": 2965 }, { "epoch": 0.09, "learning_rate": 4.9539616265028266e-06, "loss": 1.1274, "step": 2966 }, { "epoch": 0.09, "learning_rate": 4.953915019342234e-06, "loss": 1.1003, "step": 2967 }, { "epoch": 0.09, "learning_rate": 4.953868388821552e-06, "loss": 1.2547, "step": 2968 }, { "epoch": 0.09, "learning_rate": 4.953821734941226e-06, "loss": 1.146, "step": 2969 }, { "epoch": 0.09, "learning_rate": 4.953775057701698e-06, "loss": 1.2314, "step": 2970 }, { "epoch": 0.09, "learning_rate": 4.9537283571034125e-06, "loss": 1.0841, "step": 2971 }, { "epoch": 0.09, "learning_rate": 4.953681633146815e-06, "loss": 1.2333, "step": 2972 }, { "epoch": 0.09, "learning_rate": 4.95363488583235e-06, "loss": 1.1464, "step": 2973 }, { "epoch": 0.09, "learning_rate": 4.953588115160463e-06, "loss": 1.1412, "step": 2974 }, { "epoch": 0.09, "learning_rate": 4.9535413211316e-06, "loss": 1.106, "step": 2975 }, { "epoch": 0.09, "learning_rate": 4.953494503746203e-06, "loss": 1.1857, "step": 2976 }, { "epoch": 0.09, "learning_rate": 4.953447663004723e-06, "loss": 1.1918, "step": 2977 }, { "epoch": 0.09, "learning_rate": 4.9534007989076e-06, "loss": 1.199, "step": 2978 }, { "epoch": 0.09, "learning_rate": 4.9533539114552845e-06, "loss": 1.1473, "step": 2979 }, { "epoch": 0.09, "learning_rate": 4.95330700064822e-06, "loss": 1.174, "step": 2980 }, { "epoch": 0.09, "learning_rate": 4.953260066486856e-06, "loss": 1.2944, "step": 2981 }, { "epoch": 0.09, "learning_rate": 4.9532131089716365e-06, "loss": 1.0835, "step": 2982 }, { "epoch": 0.09, "learning_rate": 4.9531661281030104e-06, "loss": 1.1403, "step": 2983 }, { "epoch": 0.09, "learning_rate": 4.953119123881424e-06, "loss": 1.053, "step": 2984 }, { "epoch": 0.09, "learning_rate": 4.953072096307325e-06, "loss": 1.164, "step": 2985 }, { "epoch": 0.09, "learning_rate": 4.953025045381161e-06, "loss": 1.0737, "step": 2986 }, { "epoch": 0.09, "learning_rate": 4.95297797110338e-06, "loss": 1.2275, "step": 2987 }, { "epoch": 0.09, "learning_rate": 4.952930873474431e-06, "loss": 1.0624, "step": 2988 }, { "epoch": 0.09, "learning_rate": 4.95288375249476e-06, "loss": 1.243, "step": 2989 }, { "epoch": 0.09, "learning_rate": 4.952836608164818e-06, "loss": 1.1124, "step": 2990 }, { "epoch": 0.09, "learning_rate": 4.952789440485053e-06, "loss": 1.1404, "step": 2991 }, { "epoch": 0.09, "learning_rate": 4.952742249455913e-06, "loss": 1.1454, "step": 2992 }, { "epoch": 0.09, "learning_rate": 4.952695035077848e-06, "loss": 1.2654, "step": 2993 }, { "epoch": 0.09, "learning_rate": 4.952647797351308e-06, "loss": 1.1131, "step": 2994 }, { "epoch": 0.09, "learning_rate": 4.952600536276743e-06, "loss": 1.2073, "step": 2995 }, { "epoch": 0.09, "learning_rate": 4.9525532518546e-06, "loss": 1.1879, "step": 2996 }, { "epoch": 0.09, "learning_rate": 4.952505944085333e-06, "loss": 1.1146, "step": 2997 }, { "epoch": 0.09, "learning_rate": 4.95245861296939e-06, "loss": 1.1635, "step": 2998 }, { "epoch": 0.09, "learning_rate": 4.952411258507223e-06, "loss": 1.2443, "step": 2999 }, { "epoch": 0.09, "learning_rate": 4.95236388069928e-06, "loss": 1.0307, "step": 3000 }, { "epoch": 0.09, "learning_rate": 4.952316479546015e-06, "loss": 1.1652, "step": 3001 }, { "epoch": 0.09, "learning_rate": 4.9522690550478795e-06, "loss": 1.1127, "step": 3002 }, { "epoch": 0.09, "learning_rate": 4.9522216072053216e-06, "loss": 1.2559, "step": 3003 }, { "epoch": 0.09, "learning_rate": 4.952174136018796e-06, "loss": 1.0496, "step": 3004 }, { "epoch": 0.09, "learning_rate": 4.952126641488754e-06, "loss": 1.2035, "step": 3005 }, { "epoch": 0.09, "learning_rate": 4.952079123615647e-06, "loss": 1.1141, "step": 3006 }, { "epoch": 0.09, "learning_rate": 4.952031582399927e-06, "loss": 1.1975, "step": 3007 }, { "epoch": 0.09, "learning_rate": 4.951984017842048e-06, "loss": 1.1378, "step": 3008 }, { "epoch": 0.09, "learning_rate": 4.951936429942462e-06, "loss": 1.1065, "step": 3009 }, { "epoch": 0.09, "learning_rate": 4.951888818701623e-06, "loss": 1.0911, "step": 3010 }, { "epoch": 0.09, "learning_rate": 4.951841184119981e-06, "loss": 1.174, "step": 3011 }, { "epoch": 0.09, "learning_rate": 4.951793526197993e-06, "loss": 1.055, "step": 3012 }, { "epoch": 0.09, "learning_rate": 4.951745844936112e-06, "loss": 1.2589, "step": 3013 }, { "epoch": 0.09, "learning_rate": 4.951698140334791e-06, "loss": 1.1311, "step": 3014 }, { "epoch": 0.09, "learning_rate": 4.951650412394484e-06, "loss": 1.162, "step": 3015 }, { "epoch": 0.09, "learning_rate": 4.951602661115647e-06, "loss": 1.1169, "step": 3016 }, { "epoch": 0.09, "learning_rate": 4.9515548864987315e-06, "loss": 1.1342, "step": 3017 }, { "epoch": 0.09, "learning_rate": 4.951507088544196e-06, "loss": 1.2395, "step": 3018 }, { "epoch": 0.09, "learning_rate": 4.951459267252493e-06, "loss": 1.0309, "step": 3019 }, { "epoch": 0.09, "learning_rate": 4.9514114226240785e-06, "loss": 1.1552, "step": 3020 }, { "epoch": 0.09, "learning_rate": 4.951363554659408e-06, "loss": 1.116, "step": 3021 }, { "epoch": 0.09, "learning_rate": 4.951315663358936e-06, "loss": 1.1329, "step": 3022 }, { "epoch": 0.09, "learning_rate": 4.951267748723121e-06, "loss": 1.2539, "step": 3023 }, { "epoch": 0.09, "learning_rate": 4.951219810752417e-06, "loss": 1.1234, "step": 3024 }, { "epoch": 0.09, "learning_rate": 4.951171849447281e-06, "loss": 1.2551, "step": 3025 }, { "epoch": 0.09, "learning_rate": 4.9511238648081695e-06, "loss": 1.1614, "step": 3026 }, { "epoch": 0.09, "learning_rate": 4.951075856835539e-06, "loss": 1.1934, "step": 3027 }, { "epoch": 0.09, "learning_rate": 4.951027825529847e-06, "loss": 1.1982, "step": 3028 }, { "epoch": 0.09, "learning_rate": 4.950979770891551e-06, "loss": 1.2494, "step": 3029 }, { "epoch": 0.09, "learning_rate": 4.950931692921107e-06, "loss": 1.1052, "step": 3030 }, { "epoch": 0.09, "learning_rate": 4.950883591618974e-06, "loss": 1.1008, "step": 3031 }, { "epoch": 0.09, "learning_rate": 4.950835466985611e-06, "loss": 1.1154, "step": 3032 }, { "epoch": 0.09, "learning_rate": 4.9507873190214735e-06, "loss": 1.1808, "step": 3033 }, { "epoch": 0.09, "learning_rate": 4.950739147727022e-06, "loss": 1.1859, "step": 3034 }, { "epoch": 0.09, "learning_rate": 4.9506909531027125e-06, "loss": 1.1058, "step": 3035 }, { "epoch": 0.09, "learning_rate": 4.950642735149007e-06, "loss": 1.1637, "step": 3036 }, { "epoch": 0.09, "learning_rate": 4.950594493866362e-06, "loss": 1.1268, "step": 3037 }, { "epoch": 0.09, "learning_rate": 4.9505462292552375e-06, "loss": 1.215, "step": 3038 }, { "epoch": 0.09, "learning_rate": 4.9504979413160936e-06, "loss": 1.1657, "step": 3039 }, { "epoch": 0.09, "learning_rate": 4.9504496300493895e-06, "loss": 1.1212, "step": 3040 }, { "epoch": 0.09, "learning_rate": 4.9504012954555845e-06, "loss": 1.1094, "step": 3041 }, { "epoch": 0.09, "learning_rate": 4.95035293753514e-06, "loss": 1.1282, "step": 3042 }, { "epoch": 0.09, "learning_rate": 4.950304556288515e-06, "loss": 1.2154, "step": 3043 }, { "epoch": 0.09, "learning_rate": 4.950256151716172e-06, "loss": 1.2187, "step": 3044 }, { "epoch": 0.09, "learning_rate": 4.95020772381857e-06, "loss": 1.1254, "step": 3045 }, { "epoch": 0.09, "learning_rate": 4.95015927259617e-06, "loss": 1.0997, "step": 3046 }, { "epoch": 0.09, "learning_rate": 4.950110798049434e-06, "loss": 1.166, "step": 3047 }, { "epoch": 0.09, "learning_rate": 4.9500623001788225e-06, "loss": 1.2461, "step": 3048 }, { "epoch": 0.09, "learning_rate": 4.950013778984799e-06, "loss": 1.1938, "step": 3049 }, { "epoch": 0.09, "learning_rate": 4.949965234467824e-06, "loss": 1.207, "step": 3050 }, { "epoch": 0.09, "learning_rate": 4.94991666662836e-06, "loss": 1.1436, "step": 3051 }, { "epoch": 0.09, "learning_rate": 4.9498680754668695e-06, "loss": 1.1876, "step": 3052 }, { "epoch": 0.09, "learning_rate": 4.949819460983814e-06, "loss": 1.129, "step": 3053 }, { "epoch": 0.09, "learning_rate": 4.9497708231796576e-06, "loss": 1.1506, "step": 3054 }, { "epoch": 0.09, "learning_rate": 4.949722162054863e-06, "loss": 1.1866, "step": 3055 }, { "epoch": 0.09, "learning_rate": 4.949673477609893e-06, "loss": 1.2469, "step": 3056 }, { "epoch": 0.09, "learning_rate": 4.949624769845211e-06, "loss": 1.0456, "step": 3057 }, { "epoch": 0.09, "learning_rate": 4.9495760387612816e-06, "loss": 1.1716, "step": 3058 }, { "epoch": 0.09, "learning_rate": 4.949527284358567e-06, "loss": 1.1522, "step": 3059 }, { "epoch": 0.09, "learning_rate": 4.949478506637533e-06, "loss": 1.1436, "step": 3060 }, { "epoch": 0.09, "learning_rate": 4.949429705598644e-06, "loss": 1.1643, "step": 3061 }, { "epoch": 0.09, "learning_rate": 4.949380881242363e-06, "loss": 1.0874, "step": 3062 }, { "epoch": 0.09, "learning_rate": 4.949332033569156e-06, "loss": 1.0877, "step": 3063 }, { "epoch": 0.09, "learning_rate": 4.949283162579488e-06, "loss": 1.1614, "step": 3064 }, { "epoch": 0.09, "learning_rate": 4.949234268273824e-06, "loss": 1.0795, "step": 3065 }, { "epoch": 0.09, "learning_rate": 4.949185350652628e-06, "loss": 1.1821, "step": 3066 }, { "epoch": 0.09, "learning_rate": 4.949136409716369e-06, "loss": 1.1685, "step": 3067 }, { "epoch": 0.09, "learning_rate": 4.949087445465509e-06, "loss": 1.2958, "step": 3068 }, { "epoch": 0.09, "learning_rate": 4.949038457900517e-06, "loss": 1.1119, "step": 3069 }, { "epoch": 0.09, "learning_rate": 4.9489894470218584e-06, "loss": 1.1686, "step": 3070 }, { "epoch": 0.09, "learning_rate": 4.94894041283e-06, "loss": 1.1072, "step": 3071 }, { "epoch": 0.09, "learning_rate": 4.9488913553254074e-06, "loss": 1.1416, "step": 3072 }, { "epoch": 0.09, "learning_rate": 4.94884227450855e-06, "loss": 1.2028, "step": 3073 }, { "epoch": 0.09, "learning_rate": 4.948793170379892e-06, "loss": 1.1866, "step": 3074 }, { "epoch": 0.09, "learning_rate": 4.948744042939903e-06, "loss": 1.135, "step": 3075 }, { "epoch": 0.09, "learning_rate": 4.9486948921890495e-06, "loss": 1.1364, "step": 3076 }, { "epoch": 0.09, "learning_rate": 4.9486457181278016e-06, "loss": 1.178, "step": 3077 }, { "epoch": 0.09, "learning_rate": 4.9485965207566245e-06, "loss": 1.1921, "step": 3078 }, { "epoch": 0.09, "learning_rate": 4.9485473000759875e-06, "loss": 1.2326, "step": 3079 }, { "epoch": 0.09, "learning_rate": 4.948498056086361e-06, "loss": 1.233, "step": 3080 }, { "epoch": 0.09, "learning_rate": 4.94844878878821e-06, "loss": 1.2241, "step": 3081 }, { "epoch": 0.09, "learning_rate": 4.9483994981820075e-06, "loss": 1.092, "step": 3082 }, { "epoch": 0.09, "learning_rate": 4.94835018426822e-06, "loss": 1.0873, "step": 3083 }, { "epoch": 0.09, "learning_rate": 4.9483008470473186e-06, "loss": 1.1432, "step": 3084 }, { "epoch": 0.09, "learning_rate": 4.9482514865197726e-06, "loss": 1.0893, "step": 3085 }, { "epoch": 0.09, "learning_rate": 4.948202102686051e-06, "loss": 1.2275, "step": 3086 }, { "epoch": 0.09, "learning_rate": 4.948152695546624e-06, "loss": 1.0777, "step": 3087 }, { "epoch": 0.09, "learning_rate": 4.948103265101964e-06, "loss": 1.0773, "step": 3088 }, { "epoch": 0.09, "learning_rate": 4.948053811352538e-06, "loss": 1.0984, "step": 3089 }, { "epoch": 0.09, "learning_rate": 4.948004334298819e-06, "loss": 1.1216, "step": 3090 }, { "epoch": 0.09, "learning_rate": 4.947954833941279e-06, "loss": 1.2062, "step": 3091 }, { "epoch": 0.09, "learning_rate": 4.947905310280388e-06, "loss": 1.2548, "step": 3092 }, { "epoch": 0.09, "learning_rate": 4.947855763316616e-06, "loss": 1.224, "step": 3093 }, { "epoch": 0.09, "learning_rate": 4.947806193050436e-06, "loss": 1.2088, "step": 3094 }, { "epoch": 0.09, "learning_rate": 4.947756599482321e-06, "loss": 1.1069, "step": 3095 }, { "epoch": 0.09, "learning_rate": 4.947706982612742e-06, "loss": 1.1532, "step": 3096 }, { "epoch": 0.09, "learning_rate": 4.947657342442171e-06, "loss": 1.1392, "step": 3097 }, { "epoch": 0.09, "learning_rate": 4.947607678971082e-06, "loss": 1.1431, "step": 3098 }, { "epoch": 0.09, "learning_rate": 4.9475579921999455e-06, "loss": 1.1683, "step": 3099 }, { "epoch": 0.09, "learning_rate": 4.947508282129235e-06, "loss": 1.239, "step": 3100 }, { "epoch": 0.09, "learning_rate": 4.9474585487594265e-06, "loss": 1.1583, "step": 3101 }, { "epoch": 0.09, "learning_rate": 4.94740879209099e-06, "loss": 1.1873, "step": 3102 }, { "epoch": 0.09, "learning_rate": 4.947359012124401e-06, "loss": 1.1223, "step": 3103 }, { "epoch": 0.09, "learning_rate": 4.947309208860132e-06, "loss": 1.1236, "step": 3104 }, { "epoch": 0.09, "learning_rate": 4.947259382298659e-06, "loss": 1.0648, "step": 3105 }, { "epoch": 0.09, "learning_rate": 4.947209532440455e-06, "loss": 1.1274, "step": 3106 }, { "epoch": 0.09, "learning_rate": 4.947159659285994e-06, "loss": 1.2524, "step": 3107 }, { "epoch": 0.09, "learning_rate": 4.947109762835753e-06, "loss": 1.0714, "step": 3108 }, { "epoch": 0.09, "learning_rate": 4.947059843090205e-06, "loss": 1.1623, "step": 3109 }, { "epoch": 0.09, "learning_rate": 4.947009900049826e-06, "loss": 1.046, "step": 3110 }, { "epoch": 0.09, "learning_rate": 4.946959933715091e-06, "loss": 1.1246, "step": 3111 }, { "epoch": 0.09, "learning_rate": 4.946909944086477e-06, "loss": 1.191, "step": 3112 }, { "epoch": 0.09, "learning_rate": 4.946859931164457e-06, "loss": 1.1734, "step": 3113 }, { "epoch": 0.09, "learning_rate": 4.94680989494951e-06, "loss": 1.0986, "step": 3114 }, { "epoch": 0.09, "learning_rate": 4.946759835442111e-06, "loss": 1.2231, "step": 3115 }, { "epoch": 0.09, "learning_rate": 4.9467097526427365e-06, "loss": 1.1915, "step": 3116 }, { "epoch": 0.09, "learning_rate": 4.946659646551864e-06, "loss": 1.1704, "step": 3117 }, { "epoch": 0.09, "learning_rate": 4.94660951716997e-06, "loss": 1.2746, "step": 3118 }, { "epoch": 0.09, "learning_rate": 4.946559364497532e-06, "loss": 1.2865, "step": 3119 }, { "epoch": 0.09, "learning_rate": 4.9465091885350265e-06, "loss": 1.0979, "step": 3120 }, { "epoch": 0.09, "learning_rate": 4.946458989282932e-06, "loss": 1.0971, "step": 3121 }, { "epoch": 0.09, "learning_rate": 4.946408766741726e-06, "loss": 1.1631, "step": 3122 }, { "epoch": 0.09, "learning_rate": 4.946358520911887e-06, "loss": 1.2045, "step": 3123 }, { "epoch": 0.09, "learning_rate": 4.9463082517938934e-06, "loss": 1.0795, "step": 3124 }, { "epoch": 0.09, "learning_rate": 4.946257959388223e-06, "loss": 1.252, "step": 3125 }, { "epoch": 0.09, "learning_rate": 4.946207643695355e-06, "loss": 1.205, "step": 3126 }, { "epoch": 0.09, "learning_rate": 4.9461573047157686e-06, "loss": 1.1415, "step": 3127 }, { "epoch": 0.09, "learning_rate": 4.946106942449942e-06, "loss": 1.1571, "step": 3128 }, { "epoch": 0.09, "learning_rate": 4.946056556898357e-06, "loss": 1.0463, "step": 3129 }, { "epoch": 0.09, "learning_rate": 4.94600614806149e-06, "loss": 1.2162, "step": 3130 }, { "epoch": 0.09, "learning_rate": 4.945955715939823e-06, "loss": 1.137, "step": 3131 }, { "epoch": 0.09, "learning_rate": 4.945905260533836e-06, "loss": 1.1024, "step": 3132 }, { "epoch": 0.09, "learning_rate": 4.945854781844009e-06, "loss": 1.1042, "step": 3133 }, { "epoch": 0.09, "learning_rate": 4.945804279870822e-06, "loss": 1.1397, "step": 3134 }, { "epoch": 0.09, "learning_rate": 4.945753754614756e-06, "loss": 1.1523, "step": 3135 }, { "epoch": 0.09, "learning_rate": 4.945703206076293e-06, "loss": 1.2143, "step": 3136 }, { "epoch": 0.09, "learning_rate": 4.945652634255912e-06, "loss": 1.1299, "step": 3137 }, { "epoch": 0.09, "learning_rate": 4.945602039154097e-06, "loss": 1.328, "step": 3138 }, { "epoch": 0.09, "learning_rate": 4.945551420771329e-06, "loss": 1.0591, "step": 3139 }, { "epoch": 0.09, "learning_rate": 4.945500779108088e-06, "loss": 1.1744, "step": 3140 }, { "epoch": 0.09, "learning_rate": 4.945450114164858e-06, "loss": 1.1287, "step": 3141 }, { "epoch": 0.09, "learning_rate": 4.94539942594212e-06, "loss": 1.1609, "step": 3142 }, { "epoch": 0.09, "learning_rate": 4.945348714440357e-06, "loss": 1.1583, "step": 3143 }, { "epoch": 0.09, "learning_rate": 4.945297979660053e-06, "loss": 1.0555, "step": 3144 }, { "epoch": 0.09, "learning_rate": 4.94524722160169e-06, "loss": 1.1729, "step": 3145 }, { "epoch": 0.09, "learning_rate": 4.94519644026575e-06, "loss": 1.1287, "step": 3146 }, { "epoch": 0.09, "learning_rate": 4.9451456356527184e-06, "loss": 1.0883, "step": 3147 }, { "epoch": 0.09, "learning_rate": 4.945094807763078e-06, "loss": 1.1818, "step": 3148 }, { "epoch": 0.09, "learning_rate": 4.945043956597312e-06, "loss": 1.1029, "step": 3149 }, { "epoch": 0.09, "learning_rate": 4.944993082155906e-06, "loss": 1.1542, "step": 3150 }, { "epoch": 0.09, "learning_rate": 4.944942184439343e-06, "loss": 1.155, "step": 3151 }, { "epoch": 0.09, "learning_rate": 4.944891263448108e-06, "loss": 1.1722, "step": 3152 }, { "epoch": 0.09, "learning_rate": 4.944840319182685e-06, "loss": 1.196, "step": 3153 }, { "epoch": 0.1, "learning_rate": 4.94478935164356e-06, "loss": 1.2339, "step": 3154 }, { "epoch": 0.1, "learning_rate": 4.9447383608312185e-06, "loss": 1.3003, "step": 3155 }, { "epoch": 0.1, "learning_rate": 4.9446873467461445e-06, "loss": 1.3044, "step": 3156 }, { "epoch": 0.1, "learning_rate": 4.944636309388824e-06, "loss": 1.1417, "step": 3157 }, { "epoch": 0.1, "learning_rate": 4.944585248759744e-06, "loss": 1.1194, "step": 3158 }, { "epoch": 0.1, "learning_rate": 4.944534164859389e-06, "loss": 1.2091, "step": 3159 }, { "epoch": 0.1, "learning_rate": 4.944483057688248e-06, "loss": 1.1187, "step": 3160 }, { "epoch": 0.1, "learning_rate": 4.944431927246803e-06, "loss": 1.1237, "step": 3161 }, { "epoch": 0.1, "learning_rate": 4.944380773535545e-06, "loss": 1.3811, "step": 3162 }, { "epoch": 0.1, "learning_rate": 4.944329596554959e-06, "loss": 1.0936, "step": 3163 }, { "epoch": 0.1, "learning_rate": 4.944278396305532e-06, "loss": 1.1062, "step": 3164 }, { "epoch": 0.1, "learning_rate": 4.944227172787752e-06, "loss": 1.0694, "step": 3165 }, { "epoch": 0.1, "learning_rate": 4.9441759260021076e-06, "loss": 1.1559, "step": 3166 }, { "epoch": 0.1, "learning_rate": 4.944124655949084e-06, "loss": 1.2209, "step": 3167 }, { "epoch": 0.1, "learning_rate": 4.944073362629171e-06, "loss": 1.1547, "step": 3168 }, { "epoch": 0.1, "learning_rate": 4.9440220460428575e-06, "loss": 1.1335, "step": 3169 }, { "epoch": 0.1, "learning_rate": 4.9439707061906305e-06, "loss": 1.3018, "step": 3170 }, { "epoch": 0.1, "learning_rate": 4.94391934307298e-06, "loss": 1.1504, "step": 3171 }, { "epoch": 0.1, "learning_rate": 4.943867956690394e-06, "loss": 1.1912, "step": 3172 }, { "epoch": 0.1, "learning_rate": 4.943816547043362e-06, "loss": 1.1115, "step": 3173 }, { "epoch": 0.1, "learning_rate": 4.943765114132374e-06, "loss": 1.3207, "step": 3174 }, { "epoch": 0.1, "learning_rate": 4.9437136579579185e-06, "loss": 1.056, "step": 3175 }, { "epoch": 0.1, "learning_rate": 4.943662178520486e-06, "loss": 1.0392, "step": 3176 }, { "epoch": 0.1, "learning_rate": 4.943610675820567e-06, "loss": 1.1793, "step": 3177 }, { "epoch": 0.1, "learning_rate": 4.943559149858651e-06, "loss": 1.0989, "step": 3178 }, { "epoch": 0.1, "learning_rate": 4.943507600635229e-06, "loss": 1.1898, "step": 3179 }, { "epoch": 0.1, "learning_rate": 4.94345602815079e-06, "loss": 1.1816, "step": 3180 }, { "epoch": 0.1, "learning_rate": 4.943404432405828e-06, "loss": 1.2255, "step": 3181 }, { "epoch": 0.1, "learning_rate": 4.943352813400832e-06, "loss": 1.1296, "step": 3182 }, { "epoch": 0.1, "learning_rate": 4.943301171136294e-06, "loss": 1.1248, "step": 3183 }, { "epoch": 0.1, "learning_rate": 4.943249505612705e-06, "loss": 1.0747, "step": 3184 }, { "epoch": 0.1, "learning_rate": 4.943197816830559e-06, "loss": 1.1115, "step": 3185 }, { "epoch": 0.1, "learning_rate": 4.943146104790345e-06, "loss": 1.132, "step": 3186 }, { "epoch": 0.1, "learning_rate": 4.943094369492558e-06, "loss": 1.1797, "step": 3187 }, { "epoch": 0.1, "learning_rate": 4.9430426109376885e-06, "loss": 1.2031, "step": 3188 }, { "epoch": 0.1, "learning_rate": 4.9429908291262295e-06, "loss": 1.1906, "step": 3189 }, { "epoch": 0.1, "learning_rate": 4.942939024058675e-06, "loss": 1.0386, "step": 3190 }, { "epoch": 0.1, "learning_rate": 4.942887195735518e-06, "loss": 1.1169, "step": 3191 }, { "epoch": 0.1, "learning_rate": 4.94283534415725e-06, "loss": 1.1697, "step": 3192 }, { "epoch": 0.1, "learning_rate": 4.9427834693243674e-06, "loss": 1.1342, "step": 3193 }, { "epoch": 0.1, "learning_rate": 4.942731571237361e-06, "loss": 1.3251, "step": 3194 }, { "epoch": 0.1, "learning_rate": 4.942679649896729e-06, "loss": 1.2008, "step": 3195 }, { "epoch": 0.1, "learning_rate": 4.942627705302962e-06, "loss": 1.2267, "step": 3196 }, { "epoch": 0.1, "learning_rate": 4.9425757374565545e-06, "loss": 1.2269, "step": 3197 }, { "epoch": 0.1, "learning_rate": 4.942523746358004e-06, "loss": 1.2325, "step": 3198 }, { "epoch": 0.1, "learning_rate": 4.942471732007802e-06, "loss": 1.1465, "step": 3199 }, { "epoch": 0.1, "learning_rate": 4.942419694406447e-06, "loss": 1.1619, "step": 3200 }, { "epoch": 0.1, "learning_rate": 4.942367633554432e-06, "loss": 1.1921, "step": 3201 }, { "epoch": 0.1, "learning_rate": 4.942315549452254e-06, "loss": 1.1981, "step": 3202 }, { "epoch": 0.1, "learning_rate": 4.9422634421004075e-06, "loss": 1.1534, "step": 3203 }, { "epoch": 0.1, "learning_rate": 4.942211311499391e-06, "loss": 1.1879, "step": 3204 }, { "epoch": 0.1, "learning_rate": 4.942159157649698e-06, "loss": 1.1458, "step": 3205 }, { "epoch": 0.1, "learning_rate": 4.942106980551825e-06, "loss": 1.0948, "step": 3206 }, { "epoch": 0.1, "learning_rate": 4.942054780206271e-06, "loss": 1.1998, "step": 3207 }, { "epoch": 0.1, "learning_rate": 4.942002556613531e-06, "loss": 1.0822, "step": 3208 }, { "epoch": 0.1, "learning_rate": 4.941950309774103e-06, "loss": 1.1339, "step": 3209 }, { "epoch": 0.1, "learning_rate": 4.941898039688484e-06, "loss": 1.0731, "step": 3210 }, { "epoch": 0.1, "learning_rate": 4.941845746357171e-06, "loss": 1.2609, "step": 3211 }, { "epoch": 0.1, "learning_rate": 4.941793429780663e-06, "loss": 1.1724, "step": 3212 }, { "epoch": 0.1, "learning_rate": 4.941741089959459e-06, "loss": 1.1368, "step": 3213 }, { "epoch": 0.1, "learning_rate": 4.941688726894054e-06, "loss": 1.1832, "step": 3214 }, { "epoch": 0.1, "learning_rate": 4.941636340584949e-06, "loss": 1.1823, "step": 3215 }, { "epoch": 0.1, "learning_rate": 4.941583931032642e-06, "loss": 1.1663, "step": 3216 }, { "epoch": 0.1, "learning_rate": 4.9415314982376314e-06, "loss": 1.1896, "step": 3217 }, { "epoch": 0.1, "learning_rate": 4.941479042200417e-06, "loss": 1.2441, "step": 3218 }, { "epoch": 0.1, "learning_rate": 4.941426562921498e-06, "loss": 1.2274, "step": 3219 }, { "epoch": 0.1, "learning_rate": 4.941374060401375e-06, "loss": 1.0997, "step": 3220 }, { "epoch": 0.1, "learning_rate": 4.941321534640546e-06, "loss": 1.1738, "step": 3221 }, { "epoch": 0.1, "learning_rate": 4.941268985639512e-06, "loss": 1.1628, "step": 3222 }, { "epoch": 0.1, "learning_rate": 4.9412164133987725e-06, "loss": 1.2013, "step": 3223 }, { "epoch": 0.1, "learning_rate": 4.941163817918828e-06, "loss": 1.302, "step": 3224 }, { "epoch": 0.1, "learning_rate": 4.941111199200181e-06, "loss": 1.2356, "step": 3225 }, { "epoch": 0.1, "learning_rate": 4.94105855724333e-06, "loss": 1.1663, "step": 3226 }, { "epoch": 0.1, "learning_rate": 4.941005892048778e-06, "loss": 1.144, "step": 3227 }, { "epoch": 0.1, "learning_rate": 4.940953203617025e-06, "loss": 1.1669, "step": 3228 }, { "epoch": 0.1, "learning_rate": 4.9409004919485725e-06, "loss": 1.1443, "step": 3229 }, { "epoch": 0.1, "learning_rate": 4.940847757043924e-06, "loss": 1.2047, "step": 3230 }, { "epoch": 0.1, "learning_rate": 4.94079499890358e-06, "loss": 1.1426, "step": 3231 }, { "epoch": 0.1, "learning_rate": 4.940742217528043e-06, "loss": 1.1597, "step": 3232 }, { "epoch": 0.1, "learning_rate": 4.940689412917815e-06, "loss": 1.1186, "step": 3233 }, { "epoch": 0.1, "learning_rate": 4.9406365850734e-06, "loss": 1.1689, "step": 3234 }, { "epoch": 0.1, "learning_rate": 4.940583733995301e-06, "loss": 1.1313, "step": 3235 }, { "epoch": 0.1, "learning_rate": 4.9405308596840195e-06, "loss": 1.3175, "step": 3236 }, { "epoch": 0.1, "learning_rate": 4.940477962140059e-06, "loss": 1.1793, "step": 3237 }, { "epoch": 0.1, "learning_rate": 4.940425041363924e-06, "loss": 1.213, "step": 3238 }, { "epoch": 0.1, "learning_rate": 4.940372097356119e-06, "loss": 1.1903, "step": 3239 }, { "epoch": 0.1, "learning_rate": 4.940319130117146e-06, "loss": 1.1159, "step": 3240 }, { "epoch": 0.1, "learning_rate": 4.94026613964751e-06, "loss": 1.0696, "step": 3241 }, { "epoch": 0.1, "learning_rate": 4.940213125947716e-06, "loss": 1.1241, "step": 3242 }, { "epoch": 0.1, "learning_rate": 4.940160089018268e-06, "loss": 1.1562, "step": 3243 }, { "epoch": 0.1, "learning_rate": 4.940107028859672e-06, "loss": 1.1665, "step": 3244 }, { "epoch": 0.1, "learning_rate": 4.940053945472431e-06, "loss": 1.2174, "step": 3245 }, { "epoch": 0.1, "learning_rate": 4.940000838857053e-06, "loss": 1.1779, "step": 3246 }, { "epoch": 0.1, "learning_rate": 4.939947709014041e-06, "loss": 1.1841, "step": 3247 }, { "epoch": 0.1, "learning_rate": 4.939894555943903e-06, "loss": 1.1656, "step": 3248 }, { "epoch": 0.1, "learning_rate": 4.9398413796471425e-06, "loss": 1.1201, "step": 3249 }, { "epoch": 0.1, "learning_rate": 4.939788180124269e-06, "loss": 1.2313, "step": 3250 }, { "epoch": 0.1, "learning_rate": 4.939734957375785e-06, "loss": 1.0853, "step": 3251 }, { "epoch": 0.1, "learning_rate": 4.939681711402201e-06, "loss": 1.2091, "step": 3252 }, { "epoch": 0.1, "learning_rate": 4.939628442204021e-06, "loss": 1.1669, "step": 3253 }, { "epoch": 0.1, "learning_rate": 4.9395751497817535e-06, "loss": 1.1957, "step": 3254 }, { "epoch": 0.1, "learning_rate": 4.939521834135905e-06, "loss": 1.2679, "step": 3255 }, { "epoch": 0.1, "learning_rate": 4.939468495266984e-06, "loss": 1.2571, "step": 3256 }, { "epoch": 0.1, "learning_rate": 4.939415133175498e-06, "loss": 1.2072, "step": 3257 }, { "epoch": 0.1, "learning_rate": 4.939361747861955e-06, "loss": 1.1359, "step": 3258 }, { "epoch": 0.1, "learning_rate": 4.9393083393268625e-06, "loss": 1.2828, "step": 3259 }, { "epoch": 0.1, "learning_rate": 4.939254907570729e-06, "loss": 1.1078, "step": 3260 }, { "epoch": 0.1, "learning_rate": 4.939201452594065e-06, "loss": 1.2144, "step": 3261 }, { "epoch": 0.1, "learning_rate": 4.939147974397377e-06, "loss": 1.083, "step": 3262 }, { "epoch": 0.1, "learning_rate": 4.939094472981175e-06, "loss": 1.1946, "step": 3263 }, { "epoch": 0.1, "learning_rate": 4.939040948345969e-06, "loss": 1.2006, "step": 3264 }, { "epoch": 0.1, "learning_rate": 4.938987400492266e-06, "loss": 1.0947, "step": 3265 }, { "epoch": 0.1, "learning_rate": 4.93893382942058e-06, "loss": 1.196, "step": 3266 }, { "epoch": 0.1, "learning_rate": 4.938880235131417e-06, "loss": 1.2109, "step": 3267 }, { "epoch": 0.1, "learning_rate": 4.938826617625289e-06, "loss": 1.1995, "step": 3268 }, { "epoch": 0.1, "learning_rate": 4.938772976902707e-06, "loss": 1.1738, "step": 3269 }, { "epoch": 0.1, "learning_rate": 4.9387193129641806e-06, "loss": 1.2452, "step": 3270 }, { "epoch": 0.1, "learning_rate": 4.93866562581022e-06, "loss": 1.1177, "step": 3271 }, { "epoch": 0.1, "learning_rate": 4.938611915441338e-06, "loss": 1.0631, "step": 3272 }, { "epoch": 0.1, "learning_rate": 4.938558181858044e-06, "loss": 1.2183, "step": 3273 }, { "epoch": 0.1, "learning_rate": 4.938504425060851e-06, "loss": 1.1512, "step": 3274 }, { "epoch": 0.1, "learning_rate": 4.938450645050271e-06, "loss": 1.1235, "step": 3275 }, { "epoch": 0.1, "learning_rate": 4.938396841826815e-06, "loss": 1.1399, "step": 3276 }, { "epoch": 0.1, "learning_rate": 4.938343015390995e-06, "loss": 1.1996, "step": 3277 }, { "epoch": 0.1, "learning_rate": 4.938289165743324e-06, "loss": 1.2607, "step": 3278 }, { "epoch": 0.1, "learning_rate": 4.938235292884314e-06, "loss": 1.16, "step": 3279 }, { "epoch": 0.1, "learning_rate": 4.93818139681448e-06, "loss": 1.1288, "step": 3280 }, { "epoch": 0.1, "learning_rate": 4.938127477534332e-06, "loss": 1.1241, "step": 3281 }, { "epoch": 0.1, "learning_rate": 4.938073535044385e-06, "loss": 1.1732, "step": 3282 }, { "epoch": 0.1, "learning_rate": 4.938019569345152e-06, "loss": 1.1703, "step": 3283 }, { "epoch": 0.1, "learning_rate": 4.937965580437147e-06, "loss": 1.0999, "step": 3284 }, { "epoch": 0.1, "learning_rate": 4.937911568320883e-06, "loss": 1.079, "step": 3285 }, { "epoch": 0.1, "learning_rate": 4.937857532996877e-06, "loss": 1.2935, "step": 3286 }, { "epoch": 0.1, "learning_rate": 4.9378034744656395e-06, "loss": 1.1606, "step": 3287 }, { "epoch": 0.1, "learning_rate": 4.9377493927276875e-06, "loss": 1.1111, "step": 3288 }, { "epoch": 0.1, "learning_rate": 4.937695287783536e-06, "loss": 1.1775, "step": 3289 }, { "epoch": 0.1, "learning_rate": 4.937641159633699e-06, "loss": 1.0975, "step": 3290 }, { "epoch": 0.1, "learning_rate": 4.937587008278691e-06, "loss": 1.1409, "step": 3291 }, { "epoch": 0.1, "learning_rate": 4.937532833719031e-06, "loss": 1.0377, "step": 3292 }, { "epoch": 0.1, "learning_rate": 4.937478635955231e-06, "loss": 1.3254, "step": 3293 }, { "epoch": 0.1, "learning_rate": 4.937424414987808e-06, "loss": 1.103, "step": 3294 }, { "epoch": 0.1, "learning_rate": 4.937370170817279e-06, "loss": 1.1545, "step": 3295 }, { "epoch": 0.1, "learning_rate": 4.9373159034441594e-06, "loss": 1.0788, "step": 3296 }, { "epoch": 0.1, "learning_rate": 4.937261612868966e-06, "loss": 1.1106, "step": 3297 }, { "epoch": 0.1, "learning_rate": 4.937207299092217e-06, "loss": 1.1582, "step": 3298 }, { "epoch": 0.1, "learning_rate": 4.937152962114428e-06, "loss": 1.2495, "step": 3299 }, { "epoch": 0.1, "learning_rate": 4.937098601936116e-06, "loss": 1.0928, "step": 3300 }, { "epoch": 0.1, "learning_rate": 4.9370442185578e-06, "loss": 1.193, "step": 3301 }, { "epoch": 0.1, "learning_rate": 4.936989811979997e-06, "loss": 1.1707, "step": 3302 }, { "epoch": 0.1, "learning_rate": 4.936935382203223e-06, "loss": 1.1005, "step": 3303 }, { "epoch": 0.1, "learning_rate": 4.936880929227998e-06, "loss": 1.1647, "step": 3304 }, { "epoch": 0.1, "learning_rate": 4.936826453054841e-06, "loss": 1.2374, "step": 3305 }, { "epoch": 0.1, "learning_rate": 4.936771953684271e-06, "loss": 1.1423, "step": 3306 }, { "epoch": 0.1, "learning_rate": 4.936717431116804e-06, "loss": 1.1233, "step": 3307 }, { "epoch": 0.1, "learning_rate": 4.936662885352961e-06, "loss": 1.1556, "step": 3308 }, { "epoch": 0.1, "learning_rate": 4.936608316393261e-06, "loss": 1.0271, "step": 3309 }, { "epoch": 0.1, "learning_rate": 4.936553724238222e-06, "loss": 1.189, "step": 3310 }, { "epoch": 0.1, "learning_rate": 4.936499108888366e-06, "loss": 1.1667, "step": 3311 }, { "epoch": 0.1, "learning_rate": 4.936444470344213e-06, "loss": 1.2149, "step": 3312 }, { "epoch": 0.1, "learning_rate": 4.936389808606281e-06, "loss": 1.1875, "step": 3313 }, { "epoch": 0.1, "learning_rate": 4.936335123675091e-06, "loss": 1.1714, "step": 3314 }, { "epoch": 0.1, "learning_rate": 4.9362804155511655e-06, "loss": 1.1285, "step": 3315 }, { "epoch": 0.1, "learning_rate": 4.936225684235022e-06, "loss": 1.2261, "step": 3316 }, { "epoch": 0.1, "learning_rate": 4.936170929727184e-06, "loss": 1.2345, "step": 3317 }, { "epoch": 0.1, "learning_rate": 4.936116152028173e-06, "loss": 1.1685, "step": 3318 }, { "epoch": 0.1, "learning_rate": 4.936061351138509e-06, "loss": 1.168, "step": 3319 }, { "epoch": 0.1, "learning_rate": 4.936006527058713e-06, "loss": 1.0818, "step": 3320 }, { "epoch": 0.1, "learning_rate": 4.935951679789309e-06, "loss": 1.1556, "step": 3321 }, { "epoch": 0.1, "learning_rate": 4.935896809330819e-06, "loss": 1.0913, "step": 3322 }, { "epoch": 0.1, "learning_rate": 4.935841915683763e-06, "loss": 1.106, "step": 3323 }, { "epoch": 0.1, "learning_rate": 4.935786998848666e-06, "loss": 1.2561, "step": 3324 }, { "epoch": 0.1, "learning_rate": 4.93573205882605e-06, "loss": 1.1467, "step": 3325 }, { "epoch": 0.1, "learning_rate": 4.935677095616438e-06, "loss": 1.1143, "step": 3326 }, { "epoch": 0.1, "learning_rate": 4.9356221092203525e-06, "loss": 1.2142, "step": 3327 }, { "epoch": 0.1, "learning_rate": 4.935567099638317e-06, "loss": 1.2629, "step": 3328 }, { "epoch": 0.1, "learning_rate": 4.935512066870857e-06, "loss": 1.1329, "step": 3329 }, { "epoch": 0.1, "learning_rate": 4.9354570109184956e-06, "loss": 1.0713, "step": 3330 }, { "epoch": 0.1, "learning_rate": 4.935401931781754e-06, "loss": 1.1721, "step": 3331 }, { "epoch": 0.1, "learning_rate": 4.9353468294611615e-06, "loss": 1.2061, "step": 3332 }, { "epoch": 0.1, "learning_rate": 4.935291703957239e-06, "loss": 1.1255, "step": 3333 }, { "epoch": 0.1, "learning_rate": 4.935236555270511e-06, "loss": 1.1553, "step": 3334 }, { "epoch": 0.1, "learning_rate": 4.935181383401506e-06, "loss": 1.2321, "step": 3335 }, { "epoch": 0.1, "learning_rate": 4.935126188350746e-06, "loss": 1.2395, "step": 3336 }, { "epoch": 0.1, "learning_rate": 4.935070970118758e-06, "loss": 1.1923, "step": 3337 }, { "epoch": 0.1, "learning_rate": 4.935015728706067e-06, "loss": 1.2054, "step": 3338 }, { "epoch": 0.1, "learning_rate": 4.934960464113199e-06, "loss": 1.1159, "step": 3339 }, { "epoch": 0.1, "learning_rate": 4.934905176340679e-06, "loss": 1.13, "step": 3340 }, { "epoch": 0.1, "learning_rate": 4.934849865389037e-06, "loss": 1.1716, "step": 3341 }, { "epoch": 0.1, "learning_rate": 4.934794531258794e-06, "loss": 1.1248, "step": 3342 }, { "epoch": 0.1, "learning_rate": 4.934739173950481e-06, "loss": 1.157, "step": 3343 }, { "epoch": 0.1, "learning_rate": 4.934683793464624e-06, "loss": 1.0784, "step": 3344 }, { "epoch": 0.1, "learning_rate": 4.93462838980175e-06, "loss": 1.2245, "step": 3345 }, { "epoch": 0.1, "learning_rate": 4.934572962962385e-06, "loss": 1.1561, "step": 3346 }, { "epoch": 0.1, "learning_rate": 4.934517512947059e-06, "loss": 1.1293, "step": 3347 }, { "epoch": 0.1, "learning_rate": 4.934462039756299e-06, "loss": 1.1183, "step": 3348 }, { "epoch": 0.1, "learning_rate": 4.9344065433906315e-06, "loss": 1.1609, "step": 3349 }, { "epoch": 0.1, "learning_rate": 4.9343510238505876e-06, "loss": 1.1381, "step": 3350 }, { "epoch": 0.1, "learning_rate": 4.934295481136694e-06, "loss": 1.1951, "step": 3351 }, { "epoch": 0.1, "learning_rate": 4.934239915249479e-06, "loss": 1.124, "step": 3352 }, { "epoch": 0.1, "learning_rate": 4.934184326189474e-06, "loss": 1.1193, "step": 3353 }, { "epoch": 0.1, "learning_rate": 4.934128713957205e-06, "loss": 1.0648, "step": 3354 }, { "epoch": 0.1, "learning_rate": 4.934073078553204e-06, "loss": 1.282, "step": 3355 }, { "epoch": 0.1, "learning_rate": 4.934017419977999e-06, "loss": 1.1743, "step": 3356 }, { "epoch": 0.1, "learning_rate": 4.9339617382321205e-06, "loss": 1.2332, "step": 3357 }, { "epoch": 0.1, "learning_rate": 4.933906033316098e-06, "loss": 1.2386, "step": 3358 }, { "epoch": 0.1, "learning_rate": 4.933850305230463e-06, "loss": 1.0814, "step": 3359 }, { "epoch": 0.1, "learning_rate": 4.933794553975746e-06, "loss": 1.2441, "step": 3360 }, { "epoch": 0.1, "learning_rate": 4.933738779552476e-06, "loss": 1.3041, "step": 3361 }, { "epoch": 0.1, "learning_rate": 4.933682981961184e-06, "loss": 1.1505, "step": 3362 }, { "epoch": 0.1, "learning_rate": 4.933627161202403e-06, "loss": 1.1757, "step": 3363 }, { "epoch": 0.1, "learning_rate": 4.933571317276664e-06, "loss": 1.1968, "step": 3364 }, { "epoch": 0.1, "learning_rate": 4.933515450184498e-06, "loss": 1.155, "step": 3365 }, { "epoch": 0.1, "learning_rate": 4.933459559926437e-06, "loss": 1.1531, "step": 3366 }, { "epoch": 0.1, "learning_rate": 4.933403646503012e-06, "loss": 1.2979, "step": 3367 }, { "epoch": 0.1, "learning_rate": 4.9333477099147575e-06, "loss": 1.2175, "step": 3368 }, { "epoch": 0.1, "learning_rate": 4.933291750162204e-06, "loss": 1.1884, "step": 3369 }, { "epoch": 0.1, "learning_rate": 4.9332357672458855e-06, "loss": 1.2201, "step": 3370 }, { "epoch": 0.1, "learning_rate": 4.933179761166334e-06, "loss": 1.111, "step": 3371 }, { "epoch": 0.1, "learning_rate": 4.9331237319240825e-06, "loss": 1.0825, "step": 3372 }, { "epoch": 0.1, "learning_rate": 4.933067679519665e-06, "loss": 1.1298, "step": 3373 }, { "epoch": 0.1, "learning_rate": 4.933011603953616e-06, "loss": 1.276, "step": 3374 }, { "epoch": 0.1, "learning_rate": 4.932955505226468e-06, "loss": 1.2413, "step": 3375 }, { "epoch": 0.1, "learning_rate": 4.932899383338755e-06, "loss": 1.1909, "step": 3376 }, { "epoch": 0.1, "learning_rate": 4.932843238291012e-06, "loss": 1.1685, "step": 3377 }, { "epoch": 0.1, "learning_rate": 4.932787070083772e-06, "loss": 1.0543, "step": 3378 }, { "epoch": 0.1, "learning_rate": 4.932730878717572e-06, "loss": 1.1591, "step": 3379 }, { "epoch": 0.1, "learning_rate": 4.9326746641929454e-06, "loss": 1.0785, "step": 3380 }, { "epoch": 0.1, "learning_rate": 4.932618426510427e-06, "loss": 1.2025, "step": 3381 }, { "epoch": 0.1, "learning_rate": 4.9325621656705535e-06, "loss": 1.2467, "step": 3382 }, { "epoch": 0.1, "learning_rate": 4.932505881673859e-06, "loss": 1.1617, "step": 3383 }, { "epoch": 0.1, "learning_rate": 4.93244957452088e-06, "loss": 1.1282, "step": 3384 }, { "epoch": 0.1, "learning_rate": 4.932393244212154e-06, "loss": 1.1138, "step": 3385 }, { "epoch": 0.1, "learning_rate": 4.932336890748215e-06, "loss": 1.1248, "step": 3386 }, { "epoch": 0.1, "learning_rate": 4.932280514129599e-06, "loss": 1.1731, "step": 3387 }, { "epoch": 0.1, "learning_rate": 4.932224114356846e-06, "loss": 1.2731, "step": 3388 }, { "epoch": 0.1, "learning_rate": 4.93216769143049e-06, "loss": 1.2245, "step": 3389 }, { "epoch": 0.1, "learning_rate": 4.932111245351069e-06, "loss": 1.1549, "step": 3390 }, { "epoch": 0.1, "learning_rate": 4.932054776119119e-06, "loss": 1.1214, "step": 3391 }, { "epoch": 0.1, "learning_rate": 4.93199828373518e-06, "loss": 1.1395, "step": 3392 }, { "epoch": 0.1, "learning_rate": 4.931941768199789e-06, "loss": 1.1882, "step": 3393 }, { "epoch": 0.1, "learning_rate": 4.931885229513483e-06, "loss": 1.2229, "step": 3394 }, { "epoch": 0.1, "learning_rate": 4.931828667676801e-06, "loss": 1.2153, "step": 3395 }, { "epoch": 0.1, "learning_rate": 4.931772082690281e-06, "loss": 1.1734, "step": 3396 }, { "epoch": 0.1, "learning_rate": 4.9317154745544624e-06, "loss": 1.1954, "step": 3397 }, { "epoch": 0.1, "learning_rate": 4.931658843269884e-06, "loss": 1.1566, "step": 3398 }, { "epoch": 0.1, "learning_rate": 4.931602188837084e-06, "loss": 1.2188, "step": 3399 }, { "epoch": 0.1, "learning_rate": 4.9315455112566024e-06, "loss": 1.1617, "step": 3400 }, { "epoch": 0.1, "learning_rate": 4.931488810528978e-06, "loss": 1.2358, "step": 3401 }, { "epoch": 0.1, "learning_rate": 4.931432086654752e-06, "loss": 1.1324, "step": 3402 }, { "epoch": 0.1, "learning_rate": 4.931375339634464e-06, "loss": 1.1686, "step": 3403 }, { "epoch": 0.1, "learning_rate": 4.931318569468652e-06, "loss": 1.0759, "step": 3404 }, { "epoch": 0.1, "learning_rate": 4.93126177615786e-06, "loss": 1.1357, "step": 3405 }, { "epoch": 0.1, "learning_rate": 4.931204959702626e-06, "loss": 1.0846, "step": 3406 }, { "epoch": 0.1, "learning_rate": 4.9311481201034915e-06, "loss": 1.1639, "step": 3407 }, { "epoch": 0.1, "learning_rate": 4.931091257360998e-06, "loss": 1.2931, "step": 3408 }, { "epoch": 0.1, "learning_rate": 4.931034371475686e-06, "loss": 1.1605, "step": 3409 }, { "epoch": 0.1, "learning_rate": 4.930977462448098e-06, "loss": 1.2118, "step": 3410 }, { "epoch": 0.1, "learning_rate": 4.930920530278776e-06, "loss": 1.1773, "step": 3411 }, { "epoch": 0.1, "learning_rate": 4.930863574968261e-06, "loss": 1.1764, "step": 3412 }, { "epoch": 0.1, "learning_rate": 4.930806596517095e-06, "loss": 1.1806, "step": 3413 }, { "epoch": 0.1, "learning_rate": 4.930749594925821e-06, "loss": 1.0569, "step": 3414 }, { "epoch": 0.1, "learning_rate": 4.930692570194983e-06, "loss": 1.0665, "step": 3415 }, { "epoch": 0.1, "learning_rate": 4.93063552232512e-06, "loss": 1.1355, "step": 3416 }, { "epoch": 0.1, "learning_rate": 4.930578451316779e-06, "loss": 1.1921, "step": 3417 }, { "epoch": 0.1, "learning_rate": 4.930521357170501e-06, "loss": 1.0889, "step": 3418 }, { "epoch": 0.1, "learning_rate": 4.930464239886832e-06, "loss": 1.1192, "step": 3419 }, { "epoch": 0.1, "learning_rate": 4.930407099466312e-06, "loss": 1.0779, "step": 3420 }, { "epoch": 0.1, "learning_rate": 4.930349935909488e-06, "loss": 1.1828, "step": 3421 }, { "epoch": 0.1, "learning_rate": 4.930292749216902e-06, "loss": 1.1103, "step": 3422 }, { "epoch": 0.1, "learning_rate": 4.930235539389101e-06, "loss": 1.1831, "step": 3423 }, { "epoch": 0.1, "learning_rate": 4.9301783064266265e-06, "loss": 1.2289, "step": 3424 }, { "epoch": 0.1, "learning_rate": 4.9301210503300264e-06, "loss": 1.0843, "step": 3425 }, { "epoch": 0.1, "learning_rate": 4.930063771099844e-06, "loss": 1.1751, "step": 3426 }, { "epoch": 0.1, "learning_rate": 4.930006468736624e-06, "loss": 1.161, "step": 3427 }, { "epoch": 0.1, "learning_rate": 4.929949143240913e-06, "loss": 1.0482, "step": 3428 }, { "epoch": 0.1, "learning_rate": 4.929891794613257e-06, "loss": 1.276, "step": 3429 }, { "epoch": 0.1, "learning_rate": 4.929834422854201e-06, "loss": 1.1403, "step": 3430 }, { "epoch": 0.1, "learning_rate": 4.929777027964292e-06, "loss": 1.1631, "step": 3431 }, { "epoch": 0.1, "learning_rate": 4.929719609944076e-06, "loss": 1.2028, "step": 3432 }, { "epoch": 0.1, "learning_rate": 4.929662168794098e-06, "loss": 1.108, "step": 3433 }, { "epoch": 0.1, "learning_rate": 4.929604704514907e-06, "loss": 1.0583, "step": 3434 }, { "epoch": 0.1, "learning_rate": 4.92954721710705e-06, "loss": 1.196, "step": 3435 }, { "epoch": 0.1, "learning_rate": 4.9294897065710735e-06, "loss": 1.2368, "step": 3436 }, { "epoch": 0.1, "learning_rate": 4.929432172907525e-06, "loss": 1.2068, "step": 3437 }, { "epoch": 0.1, "learning_rate": 4.929374616116952e-06, "loss": 1.1431, "step": 3438 }, { "epoch": 0.1, "learning_rate": 4.929317036199903e-06, "loss": 1.1902, "step": 3439 }, { "epoch": 0.1, "learning_rate": 4.929259433156926e-06, "loss": 1.1426, "step": 3440 }, { "epoch": 0.1, "learning_rate": 4.929201806988569e-06, "loss": 1.1915, "step": 3441 }, { "epoch": 0.1, "learning_rate": 4.92914415769538e-06, "loss": 1.2585, "step": 3442 }, { "epoch": 0.1, "learning_rate": 4.92908648527791e-06, "loss": 1.2078, "step": 3443 }, { "epoch": 0.1, "learning_rate": 4.929028789736705e-06, "loss": 1.3217, "step": 3444 }, { "epoch": 0.1, "learning_rate": 4.9289710710723175e-06, "loss": 1.1298, "step": 3445 }, { "epoch": 0.1, "learning_rate": 4.928913329285293e-06, "loss": 1.183, "step": 3446 }, { "epoch": 0.1, "learning_rate": 4.928855564376185e-06, "loss": 1.0795, "step": 3447 }, { "epoch": 0.1, "learning_rate": 4.928797776345542e-06, "loss": 1.0203, "step": 3448 }, { "epoch": 0.1, "learning_rate": 4.928739965193913e-06, "loss": 1.1268, "step": 3449 }, { "epoch": 0.1, "learning_rate": 4.928682130921849e-06, "loss": 1.1587, "step": 3450 }, { "epoch": 0.1, "learning_rate": 4.928624273529902e-06, "loss": 1.1679, "step": 3451 }, { "epoch": 0.1, "learning_rate": 4.92856639301862e-06, "loss": 1.0667, "step": 3452 }, { "epoch": 0.1, "learning_rate": 4.928508489388557e-06, "loss": 1.1591, "step": 3453 }, { "epoch": 0.1, "learning_rate": 4.928450562640262e-06, "loss": 1.0694, "step": 3454 }, { "epoch": 0.1, "learning_rate": 4.928392612774288e-06, "loss": 1.101, "step": 3455 }, { "epoch": 0.1, "learning_rate": 4.928334639791185e-06, "loss": 1.2019, "step": 3456 }, { "epoch": 0.1, "learning_rate": 4.928276643691507e-06, "loss": 1.1002, "step": 3457 }, { "epoch": 0.1, "learning_rate": 4.928218624475803e-06, "loss": 1.0591, "step": 3458 }, { "epoch": 0.1, "learning_rate": 4.928160582144628e-06, "loss": 1.0807, "step": 3459 }, { "epoch": 0.1, "learning_rate": 4.928102516698535e-06, "loss": 1.2179, "step": 3460 }, { "epoch": 0.1, "learning_rate": 4.928044428138075e-06, "loss": 1.1128, "step": 3461 }, { "epoch": 0.1, "learning_rate": 4.9279863164638e-06, "loss": 1.137, "step": 3462 }, { "epoch": 0.1, "learning_rate": 4.9279281816762655e-06, "loss": 1.3337, "step": 3463 }, { "epoch": 0.1, "learning_rate": 4.927870023776024e-06, "loss": 1.1205, "step": 3464 }, { "epoch": 0.1, "learning_rate": 4.927811842763629e-06, "loss": 1.0752, "step": 3465 }, { "epoch": 0.1, "learning_rate": 4.9277536386396355e-06, "loss": 1.1647, "step": 3466 }, { "epoch": 0.1, "learning_rate": 4.927695411404595e-06, "loss": 1.2195, "step": 3467 }, { "epoch": 0.1, "learning_rate": 4.927637161059065e-06, "loss": 1.2367, "step": 3468 }, { "epoch": 0.1, "learning_rate": 4.927578887603597e-06, "loss": 1.2635, "step": 3469 }, { "epoch": 0.1, "learning_rate": 4.927520591038748e-06, "loss": 1.1798, "step": 3470 }, { "epoch": 0.1, "learning_rate": 4.927462271365072e-06, "loss": 1.2372, "step": 3471 }, { "epoch": 0.1, "learning_rate": 4.927403928583124e-06, "loss": 1.1016, "step": 3472 }, { "epoch": 0.1, "learning_rate": 4.927345562693459e-06, "loss": 1.1756, "step": 3473 }, { "epoch": 0.1, "learning_rate": 4.927287173696634e-06, "loss": 1.2414, "step": 3474 }, { "epoch": 0.1, "learning_rate": 4.927228761593205e-06, "loss": 1.1159, "step": 3475 }, { "epoch": 0.1, "learning_rate": 4.927170326383726e-06, "loss": 1.2666, "step": 3476 }, { "epoch": 0.1, "learning_rate": 4.9271118680687554e-06, "loss": 1.1105, "step": 3477 }, { "epoch": 0.1, "learning_rate": 4.927053386648848e-06, "loss": 1.0909, "step": 3478 }, { "epoch": 0.1, "learning_rate": 4.9269948821245616e-06, "loss": 1.1592, "step": 3479 }, { "epoch": 0.1, "learning_rate": 4.9269363544964525e-06, "loss": 1.1574, "step": 3480 }, { "epoch": 0.1, "learning_rate": 4.9268778037650785e-06, "loss": 1.1025, "step": 3481 }, { "epoch": 0.1, "learning_rate": 4.926819229930997e-06, "loss": 1.0784, "step": 3482 }, { "epoch": 0.1, "learning_rate": 4.926760632994764e-06, "loss": 1.0974, "step": 3483 }, { "epoch": 0.1, "learning_rate": 4.92670201295694e-06, "loss": 1.2345, "step": 3484 }, { "epoch": 0.1, "learning_rate": 4.92664336981808e-06, "loss": 1.0013, "step": 3485 }, { "epoch": 0.11, "learning_rate": 4.926584703578745e-06, "loss": 1.1995, "step": 3486 }, { "epoch": 0.11, "learning_rate": 4.9265260142394925e-06, "loss": 1.2115, "step": 3487 }, { "epoch": 0.11, "learning_rate": 4.92646730180088e-06, "loss": 1.1637, "step": 3488 }, { "epoch": 0.11, "learning_rate": 4.926408566263468e-06, "loss": 1.2194, "step": 3489 }, { "epoch": 0.11, "learning_rate": 4.9263498076278146e-06, "loss": 1.157, "step": 3490 }, { "epoch": 0.11, "learning_rate": 4.92629102589448e-06, "loss": 1.0804, "step": 3491 }, { "epoch": 0.11, "learning_rate": 4.926232221064023e-06, "loss": 1.1135, "step": 3492 }, { "epoch": 0.11, "learning_rate": 4.926173393137005e-06, "loss": 1.2081, "step": 3493 }, { "epoch": 0.11, "learning_rate": 4.926114542113983e-06, "loss": 1.0988, "step": 3494 }, { "epoch": 0.11, "learning_rate": 4.926055667995521e-06, "loss": 1.2161, "step": 3495 }, { "epoch": 0.11, "learning_rate": 4.9259967707821755e-06, "loss": 1.1963, "step": 3496 }, { "epoch": 0.11, "learning_rate": 4.92593785047451e-06, "loss": 1.2029, "step": 3497 }, { "epoch": 0.11, "learning_rate": 4.925878907073085e-06, "loss": 1.1039, "step": 3498 }, { "epoch": 0.11, "learning_rate": 4.92581994057846e-06, "loss": 1.1082, "step": 3499 }, { "epoch": 0.11, "learning_rate": 4.925760950991198e-06, "loss": 1.2742, "step": 3500 }, { "epoch": 0.11, "learning_rate": 4.925701938311861e-06, "loss": 1.1989, "step": 3501 }, { "epoch": 0.11, "learning_rate": 4.925642902541009e-06, "loss": 1.1265, "step": 3502 }, { "epoch": 0.11, "learning_rate": 4.925583843679205e-06, "loss": 1.0261, "step": 3503 }, { "epoch": 0.11, "learning_rate": 4.925524761727011e-06, "loss": 1.1196, "step": 3504 }, { "epoch": 0.11, "learning_rate": 4.925465656684989e-06, "loss": 1.1654, "step": 3505 }, { "epoch": 0.11, "learning_rate": 4.925406528553702e-06, "loss": 1.1317, "step": 3506 }, { "epoch": 0.11, "learning_rate": 4.9253473773337135e-06, "loss": 1.2106, "step": 3507 }, { "epoch": 0.11, "learning_rate": 4.925288203025585e-06, "loss": 1.1327, "step": 3508 }, { "epoch": 0.11, "learning_rate": 4.9252290056298824e-06, "loss": 1.22, "step": 3509 }, { "epoch": 0.11, "learning_rate": 4.925169785147167e-06, "loss": 1.1777, "step": 3510 }, { "epoch": 0.11, "learning_rate": 4.925110541578003e-06, "loss": 1.2552, "step": 3511 }, { "epoch": 0.11, "learning_rate": 4.925051274922955e-06, "loss": 1.2845, "step": 3512 }, { "epoch": 0.11, "learning_rate": 4.924991985182587e-06, "loss": 1.1943, "step": 3513 }, { "epoch": 0.11, "learning_rate": 4.924932672357463e-06, "loss": 1.0872, "step": 3514 }, { "epoch": 0.11, "learning_rate": 4.924873336448147e-06, "loss": 1.1602, "step": 3515 }, { "epoch": 0.11, "learning_rate": 4.9248139774552066e-06, "loss": 1.1207, "step": 3516 }, { "epoch": 0.11, "learning_rate": 4.924754595379203e-06, "loss": 1.2198, "step": 3517 }, { "epoch": 0.11, "learning_rate": 4.924695190220704e-06, "loss": 1.3135, "step": 3518 }, { "epoch": 0.11, "learning_rate": 4.924635761980275e-06, "loss": 1.0959, "step": 3519 }, { "epoch": 0.11, "learning_rate": 4.924576310658482e-06, "loss": 1.1465, "step": 3520 }, { "epoch": 0.11, "learning_rate": 4.924516836255888e-06, "loss": 1.1741, "step": 3521 }, { "epoch": 0.11, "learning_rate": 4.924457338773063e-06, "loss": 1.1625, "step": 3522 }, { "epoch": 0.11, "learning_rate": 4.9243978182105725e-06, "loss": 1.1263, "step": 3523 }, { "epoch": 0.11, "learning_rate": 4.924338274568981e-06, "loss": 1.3348, "step": 3524 }, { "epoch": 0.11, "learning_rate": 4.924278707848858e-06, "loss": 1.037, "step": 3525 }, { "epoch": 0.11, "learning_rate": 4.924219118050768e-06, "loss": 1.0818, "step": 3526 }, { "epoch": 0.11, "learning_rate": 4.92415950517528e-06, "loss": 1.0959, "step": 3527 }, { "epoch": 0.11, "learning_rate": 4.9240998692229605e-06, "loss": 1.1094, "step": 3528 }, { "epoch": 0.11, "learning_rate": 4.9240402101943786e-06, "loss": 1.1663, "step": 3529 }, { "epoch": 0.11, "learning_rate": 4.923980528090101e-06, "loss": 1.207, "step": 3530 }, { "epoch": 0.11, "learning_rate": 4.923920822910696e-06, "loss": 1.1185, "step": 3531 }, { "epoch": 0.11, "learning_rate": 4.923861094656732e-06, "loss": 1.1317, "step": 3532 }, { "epoch": 0.11, "learning_rate": 4.923801343328779e-06, "loss": 1.1742, "step": 3533 }, { "epoch": 0.11, "learning_rate": 4.923741568927404e-06, "loss": 1.2179, "step": 3534 }, { "epoch": 0.11, "learning_rate": 4.923681771453176e-06, "loss": 1.2127, "step": 3535 }, { "epoch": 0.11, "learning_rate": 4.923621950906665e-06, "loss": 1.2599, "step": 3536 }, { "epoch": 0.11, "learning_rate": 4.92356210728844e-06, "loss": 0.977, "step": 3537 }, { "epoch": 0.11, "learning_rate": 4.923502240599072e-06, "loss": 1.1709, "step": 3538 }, { "epoch": 0.11, "learning_rate": 4.923442350839129e-06, "loss": 1.1567, "step": 3539 }, { "epoch": 0.11, "learning_rate": 4.923382438009182e-06, "loss": 1.1774, "step": 3540 }, { "epoch": 0.11, "learning_rate": 4.923322502109801e-06, "loss": 1.1028, "step": 3541 }, { "epoch": 0.11, "learning_rate": 4.923262543141558e-06, "loss": 1.2083, "step": 3542 }, { "epoch": 0.11, "learning_rate": 4.923202561105022e-06, "loss": 1.2598, "step": 3543 }, { "epoch": 0.11, "learning_rate": 4.923142556000765e-06, "loss": 1.0657, "step": 3544 }, { "epoch": 0.11, "learning_rate": 4.923082527829357e-06, "loss": 1.2072, "step": 3545 }, { "epoch": 0.11, "learning_rate": 4.923022476591371e-06, "loss": 1.1859, "step": 3546 }, { "epoch": 0.11, "learning_rate": 4.922962402287379e-06, "loss": 1.22, "step": 3547 }, { "epoch": 0.11, "learning_rate": 4.922902304917951e-06, "loss": 1.2292, "step": 3548 }, { "epoch": 0.11, "learning_rate": 4.9228421844836594e-06, "loss": 1.1436, "step": 3549 }, { "epoch": 0.11, "learning_rate": 4.922782040985077e-06, "loss": 1.1429, "step": 3550 }, { "epoch": 0.11, "learning_rate": 4.922721874422777e-06, "loss": 1.1891, "step": 3551 }, { "epoch": 0.11, "learning_rate": 4.922661684797332e-06, "loss": 1.047, "step": 3552 }, { "epoch": 0.11, "learning_rate": 4.922601472109313e-06, "loss": 1.0425, "step": 3553 }, { "epoch": 0.11, "learning_rate": 4.922541236359296e-06, "loss": 1.1476, "step": 3554 }, { "epoch": 0.11, "learning_rate": 4.922480977547853e-06, "loss": 1.1392, "step": 3555 }, { "epoch": 0.11, "learning_rate": 4.922420695675559e-06, "loss": 1.1694, "step": 3556 }, { "epoch": 0.11, "learning_rate": 4.9223603907429845e-06, "loss": 1.2326, "step": 3557 }, { "epoch": 0.11, "learning_rate": 4.9223000627507065e-06, "loss": 1.1963, "step": 3558 }, { "epoch": 0.11, "learning_rate": 4.922239711699299e-06, "loss": 1.0914, "step": 3559 }, { "epoch": 0.11, "learning_rate": 4.922179337589336e-06, "loss": 1.1835, "step": 3560 }, { "epoch": 0.11, "learning_rate": 4.922118940421392e-06, "loss": 1.1022, "step": 3561 }, { "epoch": 0.11, "learning_rate": 4.922058520196042e-06, "loss": 1.1613, "step": 3562 }, { "epoch": 0.11, "learning_rate": 4.921998076913861e-06, "loss": 1.3109, "step": 3563 }, { "epoch": 0.11, "learning_rate": 4.921937610575426e-06, "loss": 1.3114, "step": 3564 }, { "epoch": 0.11, "learning_rate": 4.9218771211813105e-06, "loss": 1.0707, "step": 3565 }, { "epoch": 0.11, "learning_rate": 4.9218166087320916e-06, "loss": 1.1171, "step": 3566 }, { "epoch": 0.11, "learning_rate": 4.921756073228345e-06, "loss": 1.2383, "step": 3567 }, { "epoch": 0.11, "learning_rate": 4.921695514670647e-06, "loss": 1.1896, "step": 3568 }, { "epoch": 0.11, "learning_rate": 4.9216349330595735e-06, "loss": 1.2147, "step": 3569 }, { "epoch": 0.11, "learning_rate": 4.921574328395702e-06, "loss": 1.187, "step": 3570 }, { "epoch": 0.11, "learning_rate": 4.92151370067961e-06, "loss": 1.0742, "step": 3571 }, { "epoch": 0.11, "learning_rate": 4.921453049911872e-06, "loss": 1.1075, "step": 3572 }, { "epoch": 0.11, "learning_rate": 4.921392376093068e-06, "loss": 1.1472, "step": 3573 }, { "epoch": 0.11, "learning_rate": 4.921331679223775e-06, "loss": 1.1713, "step": 3574 }, { "epoch": 0.11, "learning_rate": 4.921270959304571e-06, "loss": 1.2493, "step": 3575 }, { "epoch": 0.11, "learning_rate": 4.9212102163360334e-06, "loss": 1.1574, "step": 3576 }, { "epoch": 0.11, "learning_rate": 4.92114945031874e-06, "loss": 1.0933, "step": 3577 }, { "epoch": 0.11, "learning_rate": 4.92108866125327e-06, "loss": 1.1713, "step": 3578 }, { "epoch": 0.11, "learning_rate": 4.921027849140203e-06, "loss": 1.1281, "step": 3579 }, { "epoch": 0.11, "learning_rate": 4.920967013980116e-06, "loss": 1.1271, "step": 3580 }, { "epoch": 0.11, "learning_rate": 4.9209061557735894e-06, "loss": 1.1141, "step": 3581 }, { "epoch": 0.11, "learning_rate": 4.9208452745212015e-06, "loss": 1.097, "step": 3582 }, { "epoch": 0.11, "learning_rate": 4.920784370223533e-06, "loss": 1.1538, "step": 3583 }, { "epoch": 0.11, "learning_rate": 4.920723442881164e-06, "loss": 1.1877, "step": 3584 }, { "epoch": 0.11, "learning_rate": 4.9206624924946715e-06, "loss": 1.224, "step": 3585 }, { "epoch": 0.11, "learning_rate": 4.92060151906464e-06, "loss": 1.15, "step": 3586 }, { "epoch": 0.11, "learning_rate": 4.9205405225916466e-06, "loss": 1.1931, "step": 3587 }, { "epoch": 0.11, "learning_rate": 4.920479503076273e-06, "loss": 1.1834, "step": 3588 }, { "epoch": 0.11, "learning_rate": 4.920418460519102e-06, "loss": 1.2601, "step": 3589 }, { "epoch": 0.11, "learning_rate": 4.920357394920711e-06, "loss": 1.0837, "step": 3590 }, { "epoch": 0.11, "learning_rate": 4.920296306281684e-06, "loss": 1.2236, "step": 3591 }, { "epoch": 0.11, "learning_rate": 4.9202351946026024e-06, "loss": 1.241, "step": 3592 }, { "epoch": 0.11, "learning_rate": 4.9201740598840465e-06, "loss": 1.2531, "step": 3593 }, { "epoch": 0.11, "learning_rate": 4.920112902126599e-06, "loss": 1.0288, "step": 3594 }, { "epoch": 0.11, "learning_rate": 4.920051721330844e-06, "loss": 1.1758, "step": 3595 }, { "epoch": 0.11, "learning_rate": 4.9199905174973605e-06, "loss": 1.1531, "step": 3596 }, { "epoch": 0.11, "learning_rate": 4.9199292906267335e-06, "loss": 1.1441, "step": 3597 }, { "epoch": 0.11, "learning_rate": 4.9198680407195445e-06, "loss": 1.16, "step": 3598 }, { "epoch": 0.11, "learning_rate": 4.919806767776378e-06, "loss": 1.1661, "step": 3599 }, { "epoch": 0.11, "learning_rate": 4.919745471797815e-06, "loss": 1.1763, "step": 3600 }, { "epoch": 0.11, "learning_rate": 4.919684152784442e-06, "loss": 1.1813, "step": 3601 }, { "epoch": 0.11, "learning_rate": 4.919622810736841e-06, "loss": 1.1475, "step": 3602 }, { "epoch": 0.11, "learning_rate": 4.919561445655596e-06, "loss": 1.0714, "step": 3603 }, { "epoch": 0.11, "learning_rate": 4.919500057541292e-06, "loss": 1.2421, "step": 3604 }, { "epoch": 0.11, "learning_rate": 4.919438646394511e-06, "loss": 1.1782, "step": 3605 }, { "epoch": 0.11, "learning_rate": 4.9193772122158416e-06, "loss": 1.1196, "step": 3606 }, { "epoch": 0.11, "learning_rate": 4.919315755005864e-06, "loss": 1.1804, "step": 3607 }, { "epoch": 0.11, "learning_rate": 4.919254274765168e-06, "loss": 1.2288, "step": 3608 }, { "epoch": 0.11, "learning_rate": 4.919192771494335e-06, "loss": 1.0918, "step": 3609 }, { "epoch": 0.11, "learning_rate": 4.919131245193951e-06, "loss": 1.2185, "step": 3610 }, { "epoch": 0.11, "learning_rate": 4.919069695864604e-06, "loss": 1.2608, "step": 3611 }, { "epoch": 0.11, "learning_rate": 4.919008123506878e-06, "loss": 1.159, "step": 3612 }, { "epoch": 0.11, "learning_rate": 4.91894652812136e-06, "loss": 1.1128, "step": 3613 }, { "epoch": 0.11, "learning_rate": 4.918884909708637e-06, "loss": 1.1409, "step": 3614 }, { "epoch": 0.11, "learning_rate": 4.9188232682692925e-06, "loss": 1.1243, "step": 3615 }, { "epoch": 0.11, "learning_rate": 4.918761603803917e-06, "loss": 1.1956, "step": 3616 }, { "epoch": 0.11, "learning_rate": 4.918699916313096e-06, "loss": 1.1477, "step": 3617 }, { "epoch": 0.11, "learning_rate": 4.918638205797416e-06, "loss": 1.2828, "step": 3618 }, { "epoch": 0.11, "learning_rate": 4.918576472257465e-06, "loss": 1.1533, "step": 3619 }, { "epoch": 0.11, "learning_rate": 4.9185147156938315e-06, "loss": 1.1677, "step": 3620 }, { "epoch": 0.11, "learning_rate": 4.918452936107102e-06, "loss": 1.1226, "step": 3621 }, { "epoch": 0.11, "learning_rate": 4.918391133497867e-06, "loss": 1.0166, "step": 3622 }, { "epoch": 0.11, "learning_rate": 4.918329307866711e-06, "loss": 1.1672, "step": 3623 }, { "epoch": 0.11, "learning_rate": 4.9182674592142254e-06, "loss": 1.2058, "step": 3624 }, { "epoch": 0.11, "learning_rate": 4.918205587540998e-06, "loss": 1.2291, "step": 3625 }, { "epoch": 0.11, "learning_rate": 4.918143692847619e-06, "loss": 1.2146, "step": 3626 }, { "epoch": 0.11, "learning_rate": 4.918081775134676e-06, "loss": 1.1763, "step": 3627 }, { "epoch": 0.11, "learning_rate": 4.91801983440276e-06, "loss": 1.076, "step": 3628 }, { "epoch": 0.11, "learning_rate": 4.9179578706524585e-06, "loss": 1.0945, "step": 3629 }, { "epoch": 0.11, "learning_rate": 4.917895883884363e-06, "loss": 1.2259, "step": 3630 }, { "epoch": 0.11, "learning_rate": 4.917833874099063e-06, "loss": 1.2255, "step": 3631 }, { "epoch": 0.11, "learning_rate": 4.917771841297149e-06, "loss": 1.163, "step": 3632 }, { "epoch": 0.11, "learning_rate": 4.917709785479212e-06, "loss": 1.2288, "step": 3633 }, { "epoch": 0.11, "learning_rate": 4.917647706645842e-06, "loss": 1.1825, "step": 3634 }, { "epoch": 0.11, "learning_rate": 4.91758560479763e-06, "loss": 1.2191, "step": 3635 }, { "epoch": 0.11, "learning_rate": 4.917523479935168e-06, "loss": 1.1838, "step": 3636 }, { "epoch": 0.11, "learning_rate": 4.917461332059046e-06, "loss": 1.005, "step": 3637 }, { "epoch": 0.11, "learning_rate": 4.917399161169857e-06, "loss": 1.2609, "step": 3638 }, { "epoch": 0.11, "learning_rate": 4.917336967268192e-06, "loss": 1.1004, "step": 3639 }, { "epoch": 0.11, "learning_rate": 4.917274750354644e-06, "loss": 1.1979, "step": 3640 }, { "epoch": 0.11, "learning_rate": 4.917212510429803e-06, "loss": 1.0795, "step": 3641 }, { "epoch": 0.11, "learning_rate": 4.917150247494265e-06, "loss": 1.1809, "step": 3642 }, { "epoch": 0.11, "learning_rate": 4.917087961548619e-06, "loss": 1.2954, "step": 3643 }, { "epoch": 0.11, "learning_rate": 4.91702565259346e-06, "loss": 1.226, "step": 3644 }, { "epoch": 0.11, "learning_rate": 4.916963320629382e-06, "loss": 1.1742, "step": 3645 }, { "epoch": 0.11, "learning_rate": 4.916900965656977e-06, "loss": 1.075, "step": 3646 }, { "epoch": 0.11, "learning_rate": 4.916838587676837e-06, "loss": 1.0941, "step": 3647 }, { "epoch": 0.11, "learning_rate": 4.91677618668956e-06, "loss": 1.1373, "step": 3648 }, { "epoch": 0.11, "learning_rate": 4.916713762695736e-06, "loss": 1.1924, "step": 3649 }, { "epoch": 0.11, "learning_rate": 4.916651315695962e-06, "loss": 1.189, "step": 3650 }, { "epoch": 0.11, "learning_rate": 4.916588845690831e-06, "loss": 1.0974, "step": 3651 }, { "epoch": 0.11, "learning_rate": 4.916526352680938e-06, "loss": 1.1963, "step": 3652 }, { "epoch": 0.11, "learning_rate": 4.916463836666878e-06, "loss": 1.0002, "step": 3653 }, { "epoch": 0.11, "learning_rate": 4.916401297649246e-06, "loss": 1.142, "step": 3654 }, { "epoch": 0.11, "learning_rate": 4.916338735628638e-06, "loss": 1.2803, "step": 3655 }, { "epoch": 0.11, "learning_rate": 4.916276150605648e-06, "loss": 1.0876, "step": 3656 }, { "epoch": 0.11, "learning_rate": 4.916213542580873e-06, "loss": 1.1625, "step": 3657 }, { "epoch": 0.11, "learning_rate": 4.916150911554909e-06, "loss": 1.252, "step": 3658 }, { "epoch": 0.11, "learning_rate": 4.916088257528352e-06, "loss": 1.213, "step": 3659 }, { "epoch": 0.11, "learning_rate": 4.9160255805017985e-06, "loss": 1.2091, "step": 3660 }, { "epoch": 0.11, "learning_rate": 4.915962880475845e-06, "loss": 1.1509, "step": 3661 }, { "epoch": 0.11, "learning_rate": 4.915900157451089e-06, "loss": 1.1786, "step": 3662 }, { "epoch": 0.11, "learning_rate": 4.915837411428126e-06, "loss": 1.08, "step": 3663 }, { "epoch": 0.11, "learning_rate": 4.9157746424075555e-06, "loss": 1.1235, "step": 3664 }, { "epoch": 0.11, "learning_rate": 4.915711850389973e-06, "loss": 1.1707, "step": 3665 }, { "epoch": 0.11, "learning_rate": 4.915649035375977e-06, "loss": 1.0886, "step": 3666 }, { "epoch": 0.11, "learning_rate": 4.915586197366166e-06, "loss": 1.231, "step": 3667 }, { "epoch": 0.11, "learning_rate": 4.915523336361137e-06, "loss": 1.1635, "step": 3668 }, { "epoch": 0.11, "learning_rate": 4.915460452361491e-06, "loss": 1.2129, "step": 3669 }, { "epoch": 0.11, "learning_rate": 4.9153975453678235e-06, "loss": 1.1391, "step": 3670 }, { "epoch": 0.11, "learning_rate": 4.915334615380735e-06, "loss": 1.1783, "step": 3671 }, { "epoch": 0.11, "learning_rate": 4.915271662400824e-06, "loss": 1.2493, "step": 3672 }, { "epoch": 0.11, "learning_rate": 4.9152086864286905e-06, "loss": 1.1921, "step": 3673 }, { "epoch": 0.11, "learning_rate": 4.915145687464933e-06, "loss": 1.0383, "step": 3674 }, { "epoch": 0.11, "learning_rate": 4.915082665510152e-06, "loss": 1.1871, "step": 3675 }, { "epoch": 0.11, "learning_rate": 4.915019620564947e-06, "loss": 1.1065, "step": 3676 }, { "epoch": 0.11, "learning_rate": 4.914956552629918e-06, "loss": 1.1786, "step": 3677 }, { "epoch": 0.11, "learning_rate": 4.914893461705667e-06, "loss": 1.056, "step": 3678 }, { "epoch": 0.11, "learning_rate": 4.9148303477927915e-06, "loss": 1.1888, "step": 3679 }, { "epoch": 0.11, "learning_rate": 4.914767210891895e-06, "loss": 1.1558, "step": 3680 }, { "epoch": 0.11, "learning_rate": 4.914704051003578e-06, "loss": 1.175, "step": 3681 }, { "epoch": 0.11, "learning_rate": 4.914640868128441e-06, "loss": 1.0614, "step": 3682 }, { "epoch": 0.11, "learning_rate": 4.914577662267086e-06, "loss": 1.2244, "step": 3683 }, { "epoch": 0.11, "learning_rate": 4.914514433420114e-06, "loss": 1.1647, "step": 3684 }, { "epoch": 0.11, "learning_rate": 4.914451181588128e-06, "loss": 1.1341, "step": 3685 }, { "epoch": 0.11, "learning_rate": 4.914387906771729e-06, "loss": 1.2634, "step": 3686 }, { "epoch": 0.11, "learning_rate": 4.914324608971521e-06, "loss": 1.1183, "step": 3687 }, { "epoch": 0.11, "learning_rate": 4.914261288188105e-06, "loss": 1.2073, "step": 3688 }, { "epoch": 0.11, "learning_rate": 4.914197944422085e-06, "loss": 1.1934, "step": 3689 }, { "epoch": 0.11, "learning_rate": 4.914134577674062e-06, "loss": 1.1349, "step": 3690 }, { "epoch": 0.11, "learning_rate": 4.914071187944641e-06, "loss": 1.1729, "step": 3691 }, { "epoch": 0.11, "learning_rate": 4.914007775234425e-06, "loss": 1.1388, "step": 3692 }, { "epoch": 0.11, "learning_rate": 4.913944339544018e-06, "loss": 1.2302, "step": 3693 }, { "epoch": 0.11, "learning_rate": 4.9138808808740226e-06, "loss": 1.1105, "step": 3694 }, { "epoch": 0.11, "learning_rate": 4.9138173992250435e-06, "loss": 1.1605, "step": 3695 }, { "epoch": 0.11, "learning_rate": 4.913753894597687e-06, "loss": 1.1894, "step": 3696 }, { "epoch": 0.11, "learning_rate": 4.913690366992554e-06, "loss": 1.1411, "step": 3697 }, { "epoch": 0.11, "learning_rate": 4.9136268164102525e-06, "loss": 1.1094, "step": 3698 }, { "epoch": 0.11, "learning_rate": 4.913563242851386e-06, "loss": 1.3678, "step": 3699 }, { "epoch": 0.11, "learning_rate": 4.913499646316559e-06, "loss": 1.1576, "step": 3700 }, { "epoch": 0.11, "learning_rate": 4.913436026806378e-06, "loss": 1.1562, "step": 3701 }, { "epoch": 0.11, "learning_rate": 4.91337238432145e-06, "loss": 1.1625, "step": 3702 }, { "epoch": 0.11, "learning_rate": 4.9133087188623775e-06, "loss": 1.091, "step": 3703 }, { "epoch": 0.11, "learning_rate": 4.913245030429768e-06, "loss": 1.1547, "step": 3704 }, { "epoch": 0.11, "learning_rate": 4.91318131902423e-06, "loss": 1.0096, "step": 3705 }, { "epoch": 0.11, "learning_rate": 4.9131175846463665e-06, "loss": 1.1373, "step": 3706 }, { "epoch": 0.11, "learning_rate": 4.913053827296787e-06, "loss": 1.0222, "step": 3707 }, { "epoch": 0.11, "learning_rate": 4.912990046976096e-06, "loss": 1.1248, "step": 3708 }, { "epoch": 0.11, "learning_rate": 4.912926243684902e-06, "loss": 1.0232, "step": 3709 }, { "epoch": 0.11, "learning_rate": 4.9128624174238125e-06, "loss": 1.2214, "step": 3710 }, { "epoch": 0.11, "learning_rate": 4.912798568193435e-06, "loss": 1.1442, "step": 3711 }, { "epoch": 0.11, "learning_rate": 4.912734695994377e-06, "loss": 1.0867, "step": 3712 }, { "epoch": 0.11, "learning_rate": 4.9126708008272475e-06, "loss": 1.0908, "step": 3713 }, { "epoch": 0.11, "learning_rate": 4.912606882692652e-06, "loss": 1.2321, "step": 3714 }, { "epoch": 0.11, "learning_rate": 4.9125429415912025e-06, "loss": 1.1205, "step": 3715 }, { "epoch": 0.11, "learning_rate": 4.912478977523506e-06, "loss": 1.1006, "step": 3716 }, { "epoch": 0.11, "learning_rate": 4.912414990490171e-06, "loss": 1.1176, "step": 3717 }, { "epoch": 0.11, "learning_rate": 4.912350980491808e-06, "loss": 1.2316, "step": 3718 }, { "epoch": 0.11, "learning_rate": 4.912286947529024e-06, "loss": 1.2239, "step": 3719 }, { "epoch": 0.11, "learning_rate": 4.912222891602431e-06, "loss": 1.1663, "step": 3720 }, { "epoch": 0.11, "learning_rate": 4.912158812712639e-06, "loss": 1.183, "step": 3721 }, { "epoch": 0.11, "learning_rate": 4.912094710860256e-06, "loss": 1.0963, "step": 3722 }, { "epoch": 0.11, "learning_rate": 4.912030586045893e-06, "loss": 1.1252, "step": 3723 }, { "epoch": 0.11, "learning_rate": 4.91196643827016e-06, "loss": 1.1432, "step": 3724 }, { "epoch": 0.11, "learning_rate": 4.911902267533668e-06, "loss": 1.205, "step": 3725 }, { "epoch": 0.11, "learning_rate": 4.911838073837028e-06, "loss": 1.119, "step": 3726 }, { "epoch": 0.11, "learning_rate": 4.911773857180852e-06, "loss": 1.1483, "step": 3727 }, { "epoch": 0.11, "learning_rate": 4.91170961756575e-06, "loss": 1.0544, "step": 3728 }, { "epoch": 0.11, "learning_rate": 4.9116453549923335e-06, "loss": 1.1783, "step": 3729 }, { "epoch": 0.11, "learning_rate": 4.911581069461216e-06, "loss": 1.1866, "step": 3730 }, { "epoch": 0.11, "learning_rate": 4.911516760973007e-06, "loss": 1.0441, "step": 3731 }, { "epoch": 0.11, "learning_rate": 4.91145242952832e-06, "loss": 1.1967, "step": 3732 }, { "epoch": 0.11, "learning_rate": 4.9113880751277674e-06, "loss": 1.1449, "step": 3733 }, { "epoch": 0.11, "learning_rate": 4.911323697771962e-06, "loss": 1.1879, "step": 3734 }, { "epoch": 0.11, "learning_rate": 4.911259297461516e-06, "loss": 1.117, "step": 3735 }, { "epoch": 0.11, "learning_rate": 4.911194874197043e-06, "loss": 1.21, "step": 3736 }, { "epoch": 0.11, "learning_rate": 4.911130427979156e-06, "loss": 1.0952, "step": 3737 }, { "epoch": 0.11, "learning_rate": 4.911065958808468e-06, "loss": 1.1127, "step": 3738 }, { "epoch": 0.11, "learning_rate": 4.9110014666855945e-06, "loss": 1.1763, "step": 3739 }, { "epoch": 0.11, "learning_rate": 4.910936951611147e-06, "loss": 1.1679, "step": 3740 }, { "epoch": 0.11, "learning_rate": 4.9108724135857415e-06, "loss": 1.182, "step": 3741 }, { "epoch": 0.11, "learning_rate": 4.910807852609991e-06, "loss": 1.195, "step": 3742 }, { "epoch": 0.11, "learning_rate": 4.910743268684513e-06, "loss": 1.2163, "step": 3743 }, { "epoch": 0.11, "learning_rate": 4.9106786618099175e-06, "loss": 1.2831, "step": 3744 }, { "epoch": 0.11, "learning_rate": 4.910614031986824e-06, "loss": 1.142, "step": 3745 }, { "epoch": 0.11, "learning_rate": 4.910549379215845e-06, "loss": 1.0944, "step": 3746 }, { "epoch": 0.11, "learning_rate": 4.910484703497597e-06, "loss": 1.1822, "step": 3747 }, { "epoch": 0.11, "learning_rate": 4.910420004832696e-06, "loss": 1.2083, "step": 3748 }, { "epoch": 0.11, "learning_rate": 4.910355283221756e-06, "loss": 1.1741, "step": 3749 }, { "epoch": 0.11, "learning_rate": 4.910290538665396e-06, "loss": 1.1692, "step": 3750 }, { "epoch": 0.11, "learning_rate": 4.910225771164231e-06, "loss": 1.1307, "step": 3751 }, { "epoch": 0.11, "learning_rate": 4.910160980718876e-06, "loss": 1.1163, "step": 3752 }, { "epoch": 0.11, "learning_rate": 4.910096167329951e-06, "loss": 1.2538, "step": 3753 }, { "epoch": 0.11, "learning_rate": 4.9100313309980694e-06, "loss": 1.2217, "step": 3754 }, { "epoch": 0.11, "learning_rate": 4.909966471723852e-06, "loss": 1.1719, "step": 3755 }, { "epoch": 0.11, "learning_rate": 4.909901589507914e-06, "loss": 1.2068, "step": 3756 }, { "epoch": 0.11, "learning_rate": 4.909836684350873e-06, "loss": 1.167, "step": 3757 }, { "epoch": 0.11, "learning_rate": 4.909771756253347e-06, "loss": 1.0681, "step": 3758 }, { "epoch": 0.11, "learning_rate": 4.909706805215956e-06, "loss": 1.1189, "step": 3759 }, { "epoch": 0.11, "learning_rate": 4.909641831239316e-06, "loss": 1.1713, "step": 3760 }, { "epoch": 0.11, "learning_rate": 4.909576834324046e-06, "loss": 1.2914, "step": 3761 }, { "epoch": 0.11, "learning_rate": 4.909511814470765e-06, "loss": 1.2556, "step": 3762 }, { "epoch": 0.11, "learning_rate": 4.909446771680092e-06, "loss": 1.1819, "step": 3763 }, { "epoch": 0.11, "learning_rate": 4.909381705952646e-06, "loss": 1.2318, "step": 3764 }, { "epoch": 0.11, "learning_rate": 4.909316617289047e-06, "loss": 1.1026, "step": 3765 }, { "epoch": 0.11, "learning_rate": 4.909251505689915e-06, "loss": 1.239, "step": 3766 }, { "epoch": 0.11, "learning_rate": 4.909186371155868e-06, "loss": 1.2426, "step": 3767 }, { "epoch": 0.11, "learning_rate": 4.909121213687526e-06, "loss": 1.1406, "step": 3768 }, { "epoch": 0.11, "learning_rate": 4.909056033285512e-06, "loss": 1.0969, "step": 3769 }, { "epoch": 0.11, "learning_rate": 4.908990829950444e-06, "loss": 1.1278, "step": 3770 }, { "epoch": 0.11, "learning_rate": 4.9089256036829435e-06, "loss": 1.0952, "step": 3771 }, { "epoch": 0.11, "learning_rate": 4.908860354483632e-06, "loss": 1.0869, "step": 3772 }, { "epoch": 0.11, "learning_rate": 4.90879508235313e-06, "loss": 1.27, "step": 3773 }, { "epoch": 0.11, "learning_rate": 4.908729787292058e-06, "loss": 1.2869, "step": 3774 }, { "epoch": 0.11, "learning_rate": 4.90866446930104e-06, "loss": 1.2227, "step": 3775 }, { "epoch": 0.11, "learning_rate": 4.908599128380696e-06, "loss": 1.2103, "step": 3776 }, { "epoch": 0.11, "learning_rate": 4.908533764531647e-06, "loss": 1.1744, "step": 3777 }, { "epoch": 0.11, "learning_rate": 4.908468377754517e-06, "loss": 1.1023, "step": 3778 }, { "epoch": 0.11, "learning_rate": 4.908402968049929e-06, "loss": 1.2651, "step": 3779 }, { "epoch": 0.11, "learning_rate": 4.908337535418503e-06, "loss": 1.2577, "step": 3780 }, { "epoch": 0.11, "learning_rate": 4.908272079860865e-06, "loss": 1.2133, "step": 3781 }, { "epoch": 0.11, "learning_rate": 4.9082066013776365e-06, "loss": 1.1825, "step": 3782 }, { "epoch": 0.11, "learning_rate": 4.908141099969441e-06, "loss": 1.0724, "step": 3783 }, { "epoch": 0.11, "learning_rate": 4.9080755756369015e-06, "loss": 1.1942, "step": 3784 }, { "epoch": 0.11, "learning_rate": 4.908010028380643e-06, "loss": 1.1433, "step": 3785 }, { "epoch": 0.11, "learning_rate": 4.907944458201288e-06, "loss": 1.2177, "step": 3786 }, { "epoch": 0.11, "learning_rate": 4.907878865099462e-06, "loss": 1.2366, "step": 3787 }, { "epoch": 0.11, "learning_rate": 4.907813249075788e-06, "loss": 0.9567, "step": 3788 }, { "epoch": 0.11, "learning_rate": 4.907747610130893e-06, "loss": 1.0644, "step": 3789 }, { "epoch": 0.11, "learning_rate": 4.907681948265399e-06, "loss": 1.1862, "step": 3790 }, { "epoch": 0.11, "learning_rate": 4.907616263479933e-06, "loss": 1.1389, "step": 3791 }, { "epoch": 0.11, "learning_rate": 4.90755055577512e-06, "loss": 1.2206, "step": 3792 }, { "epoch": 0.11, "learning_rate": 4.907484825151585e-06, "loss": 1.3061, "step": 3793 }, { "epoch": 0.11, "learning_rate": 4.9074190716099536e-06, "loss": 1.2146, "step": 3794 }, { "epoch": 0.11, "learning_rate": 4.907353295150853e-06, "loss": 1.0967, "step": 3795 }, { "epoch": 0.11, "learning_rate": 4.907287495774907e-06, "loss": 1.1248, "step": 3796 }, { "epoch": 0.11, "learning_rate": 4.907221673482745e-06, "loss": 1.1443, "step": 3797 }, { "epoch": 0.11, "learning_rate": 4.907155828274991e-06, "loss": 1.1216, "step": 3798 }, { "epoch": 0.11, "learning_rate": 4.907089960152273e-06, "loss": 1.2531, "step": 3799 }, { "epoch": 0.11, "learning_rate": 4.907024069115218e-06, "loss": 1.2109, "step": 3800 }, { "epoch": 0.11, "learning_rate": 4.906958155164453e-06, "loss": 1.1774, "step": 3801 }, { "epoch": 0.11, "learning_rate": 4.906892218300606e-06, "loss": 1.0862, "step": 3802 }, { "epoch": 0.11, "learning_rate": 4.906826258524304e-06, "loss": 1.1412, "step": 3803 }, { "epoch": 0.11, "learning_rate": 4.906760275836175e-06, "loss": 1.0826, "step": 3804 }, { "epoch": 0.11, "learning_rate": 4.906694270236848e-06, "loss": 1.2266, "step": 3805 }, { "epoch": 0.11, "learning_rate": 4.906628241726949e-06, "loss": 1.222, "step": 3806 }, { "epoch": 0.11, "learning_rate": 4.90656219030711e-06, "loss": 1.2038, "step": 3807 }, { "epoch": 0.11, "learning_rate": 4.906496115977957e-06, "loss": 1.1667, "step": 3808 }, { "epoch": 0.11, "learning_rate": 4.90643001874012e-06, "loss": 1.2168, "step": 3809 }, { "epoch": 0.11, "learning_rate": 4.9063638985942295e-06, "loss": 1.1287, "step": 3810 }, { "epoch": 0.11, "learning_rate": 4.906297755540912e-06, "loss": 1.1664, "step": 3811 }, { "epoch": 0.11, "learning_rate": 4.9062315895808e-06, "loss": 1.1401, "step": 3812 }, { "epoch": 0.11, "learning_rate": 4.906165400714521e-06, "loss": 1.1536, "step": 3813 }, { "epoch": 0.11, "learning_rate": 4.9060991889427065e-06, "loss": 1.1313, "step": 3814 }, { "epoch": 0.11, "learning_rate": 4.906032954265987e-06, "loss": 1.0797, "step": 3815 }, { "epoch": 0.11, "learning_rate": 4.905966696684993e-06, "loss": 1.1058, "step": 3816 }, { "epoch": 0.11, "learning_rate": 4.905900416200354e-06, "loss": 1.1215, "step": 3817 }, { "epoch": 0.12, "learning_rate": 4.905834112812702e-06, "loss": 1.2072, "step": 3818 }, { "epoch": 0.12, "learning_rate": 4.905767786522668e-06, "loss": 1.1108, "step": 3819 }, { "epoch": 0.12, "learning_rate": 4.905701437330883e-06, "loss": 1.1523, "step": 3820 }, { "epoch": 0.12, "learning_rate": 4.9056350652379795e-06, "loss": 1.2406, "step": 3821 }, { "epoch": 0.12, "learning_rate": 4.9055686702445885e-06, "loss": 1.1937, "step": 3822 }, { "epoch": 0.12, "learning_rate": 4.905502252351342e-06, "loss": 1.1006, "step": 3823 }, { "epoch": 0.12, "learning_rate": 4.905435811558873e-06, "loss": 1.2583, "step": 3824 }, { "epoch": 0.12, "learning_rate": 4.905369347867814e-06, "loss": 1.1266, "step": 3825 }, { "epoch": 0.12, "learning_rate": 4.905302861278795e-06, "loss": 1.1691, "step": 3826 }, { "epoch": 0.12, "learning_rate": 4.905236351792454e-06, "loss": 1.1618, "step": 3827 }, { "epoch": 0.12, "learning_rate": 4.90516981940942e-06, "loss": 1.0877, "step": 3828 }, { "epoch": 0.12, "learning_rate": 4.905103264130328e-06, "loss": 1.1547, "step": 3829 }, { "epoch": 0.12, "learning_rate": 4.905036685955811e-06, "loss": 1.1295, "step": 3830 }, { "epoch": 0.12, "learning_rate": 4.904970084886504e-06, "loss": 1.123, "step": 3831 }, { "epoch": 0.12, "learning_rate": 4.904903460923039e-06, "loss": 1.1128, "step": 3832 }, { "epoch": 0.12, "learning_rate": 4.904836814066052e-06, "loss": 1.0942, "step": 3833 }, { "epoch": 0.12, "learning_rate": 4.9047701443161755e-06, "loss": 1.0676, "step": 3834 }, { "epoch": 0.12, "learning_rate": 4.9047034516740465e-06, "loss": 1.1337, "step": 3835 }, { "epoch": 0.12, "learning_rate": 4.904636736140298e-06, "loss": 1.2157, "step": 3836 }, { "epoch": 0.12, "learning_rate": 4.904569997715567e-06, "loss": 1.1801, "step": 3837 }, { "epoch": 0.12, "learning_rate": 4.904503236400487e-06, "loss": 1.1072, "step": 3838 }, { "epoch": 0.12, "learning_rate": 4.904436452195695e-06, "loss": 1.2249, "step": 3839 }, { "epoch": 0.12, "learning_rate": 4.904369645101824e-06, "loss": 1.0626, "step": 3840 }, { "epoch": 0.12, "learning_rate": 4.904302815119514e-06, "loss": 1.2014, "step": 3841 }, { "epoch": 0.12, "learning_rate": 4.904235962249398e-06, "loss": 1.1893, "step": 3842 }, { "epoch": 0.12, "learning_rate": 4.9041690864921146e-06, "loss": 1.1059, "step": 3843 }, { "epoch": 0.12, "learning_rate": 4.904102187848299e-06, "loss": 1.2748, "step": 3844 }, { "epoch": 0.12, "learning_rate": 4.9040352663185875e-06, "loss": 1.0477, "step": 3845 }, { "epoch": 0.12, "learning_rate": 4.9039683219036196e-06, "loss": 1.1299, "step": 3846 }, { "epoch": 0.12, "learning_rate": 4.90390135460403e-06, "loss": 1.1935, "step": 3847 }, { "epoch": 0.12, "learning_rate": 4.903834364420457e-06, "loss": 1.1942, "step": 3848 }, { "epoch": 0.12, "learning_rate": 4.903767351353539e-06, "loss": 1.1207, "step": 3849 }, { "epoch": 0.12, "learning_rate": 4.903700315403914e-06, "loss": 1.129, "step": 3850 }, { "epoch": 0.12, "learning_rate": 4.903633256572219e-06, "loss": 1.1104, "step": 3851 }, { "epoch": 0.12, "learning_rate": 4.903566174859093e-06, "loss": 1.1812, "step": 3852 }, { "epoch": 0.12, "learning_rate": 4.9034990702651755e-06, "loss": 1.0261, "step": 3853 }, { "epoch": 0.12, "learning_rate": 4.903431942791104e-06, "loss": 1.1824, "step": 3854 }, { "epoch": 0.12, "learning_rate": 4.903364792437518e-06, "loss": 1.2101, "step": 3855 }, { "epoch": 0.12, "learning_rate": 4.903297619205057e-06, "loss": 1.0961, "step": 3856 }, { "epoch": 0.12, "learning_rate": 4.9032304230943585e-06, "loss": 1.0741, "step": 3857 }, { "epoch": 0.12, "learning_rate": 4.903163204106065e-06, "loss": 1.1062, "step": 3858 }, { "epoch": 0.12, "learning_rate": 4.903095962240815e-06, "loss": 1.1115, "step": 3859 }, { "epoch": 0.12, "learning_rate": 4.903028697499249e-06, "loss": 1.311, "step": 3860 }, { "epoch": 0.12, "learning_rate": 4.902961409882007e-06, "loss": 1.145, "step": 3861 }, { "epoch": 0.12, "learning_rate": 4.90289409938973e-06, "loss": 1.2061, "step": 3862 }, { "epoch": 0.12, "learning_rate": 4.902826766023058e-06, "loss": 1.2921, "step": 3863 }, { "epoch": 0.12, "learning_rate": 4.9027594097826325e-06, "loss": 1.1395, "step": 3864 }, { "epoch": 0.12, "learning_rate": 4.902692030669095e-06, "loss": 1.0542, "step": 3865 }, { "epoch": 0.12, "learning_rate": 4.902624628683086e-06, "loss": 1.1779, "step": 3866 }, { "epoch": 0.12, "learning_rate": 4.902557203825247e-06, "loss": 1.2233, "step": 3867 }, { "epoch": 0.12, "learning_rate": 4.902489756096223e-06, "loss": 1.2007, "step": 3868 }, { "epoch": 0.12, "learning_rate": 4.902422285496652e-06, "loss": 1.0929, "step": 3869 }, { "epoch": 0.12, "learning_rate": 4.902354792027177e-06, "loss": 1.1567, "step": 3870 }, { "epoch": 0.12, "learning_rate": 4.902287275688443e-06, "loss": 1.1915, "step": 3871 }, { "epoch": 0.12, "learning_rate": 4.902219736481091e-06, "loss": 1.1322, "step": 3872 }, { "epoch": 0.12, "learning_rate": 4.902152174405763e-06, "loss": 1.1276, "step": 3873 }, { "epoch": 0.12, "learning_rate": 4.902084589463104e-06, "loss": 1.0775, "step": 3874 }, { "epoch": 0.12, "learning_rate": 4.9020169816537565e-06, "loss": 1.1167, "step": 3875 }, { "epoch": 0.12, "learning_rate": 4.901949350978363e-06, "loss": 1.1594, "step": 3876 }, { "epoch": 0.12, "learning_rate": 4.901881697437571e-06, "loss": 1.1308, "step": 3877 }, { "epoch": 0.12, "learning_rate": 4.90181402103202e-06, "loss": 1.212, "step": 3878 }, { "epoch": 0.12, "learning_rate": 4.9017463217623566e-06, "loss": 1.2384, "step": 3879 }, { "epoch": 0.12, "learning_rate": 4.901678599629225e-06, "loss": 1.1331, "step": 3880 }, { "epoch": 0.12, "learning_rate": 4.90161085463327e-06, "loss": 1.1794, "step": 3881 }, { "epoch": 0.12, "learning_rate": 4.901543086775137e-06, "loss": 1.167, "step": 3882 }, { "epoch": 0.12, "learning_rate": 4.901475296055469e-06, "loss": 1.139, "step": 3883 }, { "epoch": 0.12, "learning_rate": 4.901407482474914e-06, "loss": 1.1216, "step": 3884 }, { "epoch": 0.12, "learning_rate": 4.901339646034116e-06, "loss": 1.0746, "step": 3885 }, { "epoch": 0.12, "learning_rate": 4.901271786733721e-06, "loss": 1.1595, "step": 3886 }, { "epoch": 0.12, "learning_rate": 4.901203904574374e-06, "loss": 1.2838, "step": 3887 }, { "epoch": 0.12, "learning_rate": 4.9011359995567245e-06, "loss": 1.1126, "step": 3888 }, { "epoch": 0.12, "learning_rate": 4.9010680716814154e-06, "loss": 1.2271, "step": 3889 }, { "epoch": 0.12, "learning_rate": 4.901000120949094e-06, "loss": 1.1295, "step": 3890 }, { "epoch": 0.12, "learning_rate": 4.900932147360409e-06, "loss": 1.0453, "step": 3891 }, { "epoch": 0.12, "learning_rate": 4.900864150916006e-06, "loss": 1.1868, "step": 3892 }, { "epoch": 0.12, "learning_rate": 4.900796131616532e-06, "loss": 1.1673, "step": 3893 }, { "epoch": 0.12, "learning_rate": 4.900728089462636e-06, "loss": 1.1267, "step": 3894 }, { "epoch": 0.12, "learning_rate": 4.900660024454964e-06, "loss": 1.1162, "step": 3895 }, { "epoch": 0.12, "learning_rate": 4.900591936594165e-06, "loss": 1.178, "step": 3896 }, { "epoch": 0.12, "learning_rate": 4.9005238258808874e-06, "loss": 1.1284, "step": 3897 }, { "epoch": 0.12, "learning_rate": 4.900455692315779e-06, "loss": 1.1567, "step": 3898 }, { "epoch": 0.12, "learning_rate": 4.900387535899488e-06, "loss": 1.1257, "step": 3899 }, { "epoch": 0.12, "learning_rate": 4.900319356632663e-06, "loss": 1.2068, "step": 3900 }, { "epoch": 0.12, "learning_rate": 4.900251154515956e-06, "loss": 1.1018, "step": 3901 }, { "epoch": 0.12, "learning_rate": 4.900182929550013e-06, "loss": 1.1716, "step": 3902 }, { "epoch": 0.12, "learning_rate": 4.900114681735484e-06, "loss": 1.1536, "step": 3903 }, { "epoch": 0.12, "learning_rate": 4.900046411073019e-06, "loss": 1.2698, "step": 3904 }, { "epoch": 0.12, "learning_rate": 4.899978117563268e-06, "loss": 1.0598, "step": 3905 }, { "epoch": 0.12, "learning_rate": 4.8999098012068825e-06, "loss": 1.095, "step": 3906 }, { "epoch": 0.12, "learning_rate": 4.8998414620045095e-06, "loss": 1.1445, "step": 3907 }, { "epoch": 0.12, "learning_rate": 4.899773099956804e-06, "loss": 1.1417, "step": 3908 }, { "epoch": 0.12, "learning_rate": 4.899704715064413e-06, "loss": 1.2033, "step": 3909 }, { "epoch": 0.12, "learning_rate": 4.899636307327988e-06, "loss": 1.1727, "step": 3910 }, { "epoch": 0.12, "learning_rate": 4.899567876748182e-06, "loss": 1.1395, "step": 3911 }, { "epoch": 0.12, "learning_rate": 4.8994994233256465e-06, "loss": 1.1589, "step": 3912 }, { "epoch": 0.12, "learning_rate": 4.899430947061031e-06, "loss": 1.1224, "step": 3913 }, { "epoch": 0.12, "learning_rate": 4.899362447954988e-06, "loss": 1.181, "step": 3914 }, { "epoch": 0.12, "learning_rate": 4.899293926008171e-06, "loss": 1.1449, "step": 3915 }, { "epoch": 0.12, "learning_rate": 4.899225381221231e-06, "loss": 1.1795, "step": 3916 }, { "epoch": 0.12, "learning_rate": 4.899156813594821e-06, "loss": 1.2145, "step": 3917 }, { "epoch": 0.12, "learning_rate": 4.899088223129593e-06, "loss": 1.2585, "step": 3918 }, { "epoch": 0.12, "learning_rate": 4.899019609826202e-06, "loss": 1.1042, "step": 3919 }, { "epoch": 0.12, "learning_rate": 4.898950973685299e-06, "loss": 1.1929, "step": 3920 }, { "epoch": 0.12, "learning_rate": 4.8988823147075374e-06, "loss": 1.0876, "step": 3921 }, { "epoch": 0.12, "learning_rate": 4.898813632893572e-06, "loss": 1.1376, "step": 3922 }, { "epoch": 0.12, "learning_rate": 4.898744928244056e-06, "loss": 1.2063, "step": 3923 }, { "epoch": 0.12, "learning_rate": 4.898676200759645e-06, "loss": 1.1913, "step": 3924 }, { "epoch": 0.12, "learning_rate": 4.89860745044099e-06, "loss": 1.197, "step": 3925 }, { "epoch": 0.12, "learning_rate": 4.898538677288748e-06, "loss": 1.2088, "step": 3926 }, { "epoch": 0.12, "learning_rate": 4.8984698813035725e-06, "loss": 1.1063, "step": 3927 }, { "epoch": 0.12, "learning_rate": 4.898401062486119e-06, "loss": 1.1101, "step": 3928 }, { "epoch": 0.12, "learning_rate": 4.898332220837043e-06, "loss": 1.1447, "step": 3929 }, { "epoch": 0.12, "learning_rate": 4.898263356356999e-06, "loss": 1.2487, "step": 3930 }, { "epoch": 0.12, "learning_rate": 4.898194469046643e-06, "loss": 1.2354, "step": 3931 }, { "epoch": 0.12, "learning_rate": 4.8981255589066305e-06, "loss": 1.1313, "step": 3932 }, { "epoch": 0.12, "learning_rate": 4.8980566259376175e-06, "loss": 1.2632, "step": 3933 }, { "epoch": 0.12, "learning_rate": 4.897987670140261e-06, "loss": 1.1255, "step": 3934 }, { "epoch": 0.12, "learning_rate": 4.897918691515216e-06, "loss": 1.1288, "step": 3935 }, { "epoch": 0.12, "learning_rate": 4.89784969006314e-06, "loss": 1.1811, "step": 3936 }, { "epoch": 0.12, "learning_rate": 4.897780665784691e-06, "loss": 1.1877, "step": 3937 }, { "epoch": 0.12, "learning_rate": 4.8977116186805225e-06, "loss": 1.0468, "step": 3938 }, { "epoch": 0.12, "learning_rate": 4.8976425487512955e-06, "loss": 1.0877, "step": 3939 }, { "epoch": 0.12, "learning_rate": 4.897573455997667e-06, "loss": 1.1125, "step": 3940 }, { "epoch": 0.12, "learning_rate": 4.897504340420293e-06, "loss": 1.1697, "step": 3941 }, { "epoch": 0.12, "learning_rate": 4.897435202019833e-06, "loss": 1.1812, "step": 3942 }, { "epoch": 0.12, "learning_rate": 4.897366040796944e-06, "loss": 1.2584, "step": 3943 }, { "epoch": 0.12, "learning_rate": 4.897296856752285e-06, "loss": 1.1428, "step": 3944 }, { "epoch": 0.12, "learning_rate": 4.897227649886515e-06, "loss": 1.197, "step": 3945 }, { "epoch": 0.12, "learning_rate": 4.897158420200291e-06, "loss": 1.2014, "step": 3946 }, { "epoch": 0.12, "learning_rate": 4.897089167694274e-06, "loss": 1.0443, "step": 3947 }, { "epoch": 0.12, "learning_rate": 4.897019892369123e-06, "loss": 1.0811, "step": 3948 }, { "epoch": 0.12, "learning_rate": 4.896950594225497e-06, "loss": 1.0956, "step": 3949 }, { "epoch": 0.12, "learning_rate": 4.8968812732640555e-06, "loss": 1.2426, "step": 3950 }, { "epoch": 0.12, "learning_rate": 4.896811929485459e-06, "loss": 1.1926, "step": 3951 }, { "epoch": 0.12, "learning_rate": 4.896742562890366e-06, "loss": 1.1155, "step": 3952 }, { "epoch": 0.12, "learning_rate": 4.89667317347944e-06, "loss": 1.123, "step": 3953 }, { "epoch": 0.12, "learning_rate": 4.896603761253339e-06, "loss": 1.2751, "step": 3954 }, { "epoch": 0.12, "learning_rate": 4.896534326212724e-06, "loss": 1.0615, "step": 3955 }, { "epoch": 0.12, "learning_rate": 4.8964648683582565e-06, "loss": 1.1392, "step": 3956 }, { "epoch": 0.12, "learning_rate": 4.8963953876905975e-06, "loss": 1.1644, "step": 3957 }, { "epoch": 0.12, "learning_rate": 4.896325884210409e-06, "loss": 1.2327, "step": 3958 }, { "epoch": 0.12, "learning_rate": 4.896256357918352e-06, "loss": 1.0842, "step": 3959 }, { "epoch": 0.12, "learning_rate": 4.896186808815089e-06, "loss": 1.168, "step": 3960 }, { "epoch": 0.12, "learning_rate": 4.896117236901281e-06, "loss": 1.2195, "step": 3961 }, { "epoch": 0.12, "learning_rate": 4.8960476421775915e-06, "loss": 1.1719, "step": 3962 }, { "epoch": 0.12, "learning_rate": 4.895978024644682e-06, "loss": 1.1777, "step": 3963 }, { "epoch": 0.12, "learning_rate": 4.895908384303215e-06, "loss": 1.1725, "step": 3964 }, { "epoch": 0.12, "learning_rate": 4.895838721153855e-06, "loss": 1.2045, "step": 3965 }, { "epoch": 0.12, "learning_rate": 4.895769035197264e-06, "loss": 1.1152, "step": 3966 }, { "epoch": 0.12, "learning_rate": 4.895699326434106e-06, "loss": 1.157, "step": 3967 }, { "epoch": 0.12, "learning_rate": 4.895629594865044e-06, "loss": 1.1582, "step": 3968 }, { "epoch": 0.12, "learning_rate": 4.8955598404907414e-06, "loss": 1.0352, "step": 3969 }, { "epoch": 0.12, "learning_rate": 4.895490063311864e-06, "loss": 1.228, "step": 3970 }, { "epoch": 0.12, "learning_rate": 4.895420263329074e-06, "loss": 1.1202, "step": 3971 }, { "epoch": 0.12, "learning_rate": 4.895350440543037e-06, "loss": 1.129, "step": 3972 }, { "epoch": 0.12, "learning_rate": 4.895280594954417e-06, "loss": 1.2013, "step": 3973 }, { "epoch": 0.12, "learning_rate": 4.89521072656388e-06, "loss": 1.0619, "step": 3974 }, { "epoch": 0.12, "learning_rate": 4.8951408353720905e-06, "loss": 1.1498, "step": 3975 }, { "epoch": 0.12, "learning_rate": 4.895070921379714e-06, "loss": 1.0991, "step": 3976 }, { "epoch": 0.12, "learning_rate": 4.8950009845874156e-06, "loss": 1.0732, "step": 3977 }, { "epoch": 0.12, "learning_rate": 4.89493102499586e-06, "loss": 1.0986, "step": 3978 }, { "epoch": 0.12, "learning_rate": 4.894861042605716e-06, "loss": 1.167, "step": 3979 }, { "epoch": 0.12, "learning_rate": 4.894791037417648e-06, "loss": 1.1758, "step": 3980 }, { "epoch": 0.12, "learning_rate": 4.8947210094323224e-06, "loss": 1.172, "step": 3981 }, { "epoch": 0.12, "learning_rate": 4.894650958650406e-06, "loss": 1.0941, "step": 3982 }, { "epoch": 0.12, "learning_rate": 4.894580885072566e-06, "loss": 1.0895, "step": 3983 }, { "epoch": 0.12, "learning_rate": 4.8945107886994706e-06, "loss": 1.1082, "step": 3984 }, { "epoch": 0.12, "learning_rate": 4.8944406695317835e-06, "loss": 1.2477, "step": 3985 }, { "epoch": 0.12, "learning_rate": 4.894370527570176e-06, "loss": 1.0917, "step": 3986 }, { "epoch": 0.12, "learning_rate": 4.8943003628153125e-06, "loss": 1.247, "step": 3987 }, { "epoch": 0.12, "learning_rate": 4.894230175267864e-06, "loss": 1.1047, "step": 3988 }, { "epoch": 0.12, "learning_rate": 4.894159964928498e-06, "loss": 1.1296, "step": 3989 }, { "epoch": 0.12, "learning_rate": 4.894089731797881e-06, "loss": 1.1556, "step": 3990 }, { "epoch": 0.12, "learning_rate": 4.894019475876684e-06, "loss": 1.1533, "step": 3991 }, { "epoch": 0.12, "learning_rate": 4.893949197165572e-06, "loss": 1.1746, "step": 3992 }, { "epoch": 0.12, "learning_rate": 4.893878895665219e-06, "loss": 1.0939, "step": 3993 }, { "epoch": 0.12, "learning_rate": 4.893808571376291e-06, "loss": 1.1954, "step": 3994 }, { "epoch": 0.12, "learning_rate": 4.893738224299459e-06, "loss": 1.1938, "step": 3995 }, { "epoch": 0.12, "learning_rate": 4.893667854435391e-06, "loss": 1.1179, "step": 3996 }, { "epoch": 0.12, "learning_rate": 4.893597461784758e-06, "loss": 1.1261, "step": 3997 }, { "epoch": 0.12, "learning_rate": 4.893527046348231e-06, "loss": 1.1122, "step": 3998 }, { "epoch": 0.12, "learning_rate": 4.893456608126478e-06, "loss": 1.1415, "step": 3999 }, { "epoch": 0.12, "learning_rate": 4.893386147120171e-06, "loss": 1.1734, "step": 4000 }, { "epoch": 0.12, "learning_rate": 4.893315663329982e-06, "loss": 1.1876, "step": 4001 }, { "epoch": 0.12, "learning_rate": 4.893245156756578e-06, "loss": 1.0404, "step": 4002 }, { "epoch": 0.12, "learning_rate": 4.893174627400635e-06, "loss": 1.1534, "step": 4003 }, { "epoch": 0.12, "learning_rate": 4.893104075262821e-06, "loss": 1.2225, "step": 4004 }, { "epoch": 0.12, "learning_rate": 4.893033500343809e-06, "loss": 1.1874, "step": 4005 }, { "epoch": 0.12, "learning_rate": 4.892962902644272e-06, "loss": 1.1133, "step": 4006 }, { "epoch": 0.12, "learning_rate": 4.892892282164878e-06, "loss": 1.218, "step": 4007 }, { "epoch": 0.12, "learning_rate": 4.892821638906304e-06, "loss": 1.0092, "step": 4008 }, { "epoch": 0.12, "learning_rate": 4.89275097286922e-06, "loss": 1.1348, "step": 4009 }, { "epoch": 0.12, "learning_rate": 4.892680284054299e-06, "loss": 1.2776, "step": 4010 }, { "epoch": 0.12, "learning_rate": 4.892609572462214e-06, "loss": 1.2147, "step": 4011 }, { "epoch": 0.12, "learning_rate": 4.892538838093638e-06, "loss": 1.1154, "step": 4012 }, { "epoch": 0.12, "learning_rate": 4.892468080949244e-06, "loss": 1.1903, "step": 4013 }, { "epoch": 0.12, "learning_rate": 4.8923973010297065e-06, "loss": 1.1724, "step": 4014 }, { "epoch": 0.12, "learning_rate": 4.892326498335699e-06, "loss": 1.1935, "step": 4015 }, { "epoch": 0.12, "learning_rate": 4.892255672867896e-06, "loss": 1.1837, "step": 4016 }, { "epoch": 0.12, "learning_rate": 4.892184824626971e-06, "loss": 1.2003, "step": 4017 }, { "epoch": 0.12, "learning_rate": 4.892113953613598e-06, "loss": 1.0804, "step": 4018 }, { "epoch": 0.12, "learning_rate": 4.892043059828453e-06, "loss": 1.2259, "step": 4019 }, { "epoch": 0.12, "learning_rate": 4.891972143272209e-06, "loss": 1.2004, "step": 4020 }, { "epoch": 0.12, "learning_rate": 4.891901203945543e-06, "loss": 1.1108, "step": 4021 }, { "epoch": 0.12, "learning_rate": 4.89183024184913e-06, "loss": 1.1335, "step": 4022 }, { "epoch": 0.12, "learning_rate": 4.891759256983644e-06, "loss": 1.1189, "step": 4023 }, { "epoch": 0.12, "learning_rate": 4.891688249349762e-06, "loss": 1.1531, "step": 4024 }, { "epoch": 0.12, "learning_rate": 4.8916172189481605e-06, "loss": 1.1503, "step": 4025 }, { "epoch": 0.12, "learning_rate": 4.8915461657795136e-06, "loss": 1.2292, "step": 4026 }, { "epoch": 0.12, "learning_rate": 4.8914750898445e-06, "loss": 1.1169, "step": 4027 }, { "epoch": 0.12, "learning_rate": 4.891403991143795e-06, "loss": 1.0782, "step": 4028 }, { "epoch": 0.12, "learning_rate": 4.891332869678076e-06, "loss": 1.1432, "step": 4029 }, { "epoch": 0.12, "learning_rate": 4.89126172544802e-06, "loss": 1.0563, "step": 4030 }, { "epoch": 0.12, "learning_rate": 4.891190558454303e-06, "loss": 1.1417, "step": 4031 }, { "epoch": 0.12, "learning_rate": 4.891119368697604e-06, "loss": 1.2013, "step": 4032 }, { "epoch": 0.12, "learning_rate": 4.891048156178601e-06, "loss": 1.12, "step": 4033 }, { "epoch": 0.12, "learning_rate": 4.8909769208979705e-06, "loss": 1.1514, "step": 4034 }, { "epoch": 0.12, "learning_rate": 4.8909056628563914e-06, "loss": 1.228, "step": 4035 }, { "epoch": 0.12, "learning_rate": 4.8908343820545415e-06, "loss": 1.2348, "step": 4036 }, { "epoch": 0.12, "learning_rate": 4.8907630784931e-06, "loss": 1.2096, "step": 4037 }, { "epoch": 0.12, "learning_rate": 4.890691752172746e-06, "loss": 1.1274, "step": 4038 }, { "epoch": 0.12, "learning_rate": 4.890620403094158e-06, "loss": 1.0328, "step": 4039 }, { "epoch": 0.12, "learning_rate": 4.8905490312580135e-06, "loss": 1.1226, "step": 4040 }, { "epoch": 0.12, "learning_rate": 4.890477636664994e-06, "loss": 1.0697, "step": 4041 }, { "epoch": 0.12, "learning_rate": 4.890406219315779e-06, "loss": 1.122, "step": 4042 }, { "epoch": 0.12, "learning_rate": 4.890334779211049e-06, "loss": 1.2617, "step": 4043 }, { "epoch": 0.12, "learning_rate": 4.890263316351482e-06, "loss": 1.1417, "step": 4044 }, { "epoch": 0.12, "learning_rate": 4.89019183073776e-06, "loss": 1.2765, "step": 4045 }, { "epoch": 0.12, "learning_rate": 4.890120322370563e-06, "loss": 1.1327, "step": 4046 }, { "epoch": 0.12, "learning_rate": 4.890048791250571e-06, "loss": 1.1147, "step": 4047 }, { "epoch": 0.12, "learning_rate": 4.889977237378466e-06, "loss": 1.2142, "step": 4048 }, { "epoch": 0.12, "learning_rate": 4.889905660754929e-06, "loss": 1.177, "step": 4049 }, { "epoch": 0.12, "learning_rate": 4.889834061380641e-06, "loss": 1.0931, "step": 4050 }, { "epoch": 0.12, "learning_rate": 4.889762439256283e-06, "loss": 1.1876, "step": 4051 }, { "epoch": 0.12, "learning_rate": 4.889690794382539e-06, "loss": 1.1779, "step": 4052 }, { "epoch": 0.12, "learning_rate": 4.889619126760088e-06, "loss": 1.0864, "step": 4053 }, { "epoch": 0.12, "learning_rate": 4.889547436389615e-06, "loss": 1.1389, "step": 4054 }, { "epoch": 0.12, "learning_rate": 4.889475723271801e-06, "loss": 1.2325, "step": 4055 }, { "epoch": 0.12, "learning_rate": 4.889403987407328e-06, "loss": 1.1602, "step": 4056 }, { "epoch": 0.12, "learning_rate": 4.8893322287968805e-06, "loss": 1.0844, "step": 4057 }, { "epoch": 0.12, "learning_rate": 4.889260447441141e-06, "loss": 1.1474, "step": 4058 }, { "epoch": 0.12, "learning_rate": 4.889188643340793e-06, "loss": 1.0902, "step": 4059 }, { "epoch": 0.12, "learning_rate": 4.889116816496519e-06, "loss": 1.2163, "step": 4060 }, { "epoch": 0.12, "learning_rate": 4.889044966909004e-06, "loss": 1.2125, "step": 4061 }, { "epoch": 0.12, "learning_rate": 4.888973094578932e-06, "loss": 1.1246, "step": 4062 }, { "epoch": 0.12, "learning_rate": 4.888901199506985e-06, "loss": 1.1583, "step": 4063 }, { "epoch": 0.12, "learning_rate": 4.888829281693851e-06, "loss": 1.1205, "step": 4064 }, { "epoch": 0.12, "learning_rate": 4.888757341140213e-06, "loss": 1.0894, "step": 4065 }, { "epoch": 0.12, "learning_rate": 4.8886853778467535e-06, "loss": 1.1497, "step": 4066 }, { "epoch": 0.12, "learning_rate": 4.888613391814161e-06, "loss": 1.1808, "step": 4067 }, { "epoch": 0.12, "learning_rate": 4.88854138304312e-06, "loss": 1.1362, "step": 4068 }, { "epoch": 0.12, "learning_rate": 4.888469351534314e-06, "loss": 1.1041, "step": 4069 }, { "epoch": 0.12, "learning_rate": 4.888397297288431e-06, "loss": 1.2537, "step": 4070 }, { "epoch": 0.12, "learning_rate": 4.888325220306155e-06, "loss": 1.1071, "step": 4071 }, { "epoch": 0.12, "learning_rate": 4.888253120588174e-06, "loss": 1.2291, "step": 4072 }, { "epoch": 0.12, "learning_rate": 4.888180998135174e-06, "loss": 1.1534, "step": 4073 }, { "epoch": 0.12, "learning_rate": 4.88810885294784e-06, "loss": 1.2229, "step": 4074 }, { "epoch": 0.12, "learning_rate": 4.88803668502686e-06, "loss": 1.1582, "step": 4075 }, { "epoch": 0.12, "learning_rate": 4.887964494372921e-06, "loss": 1.1866, "step": 4076 }, { "epoch": 0.12, "learning_rate": 4.8878922809867106e-06, "loss": 1.2329, "step": 4077 }, { "epoch": 0.12, "learning_rate": 4.887820044868915e-06, "loss": 1.0984, "step": 4078 }, { "epoch": 0.12, "learning_rate": 4.887747786020224e-06, "loss": 1.153, "step": 4079 }, { "epoch": 0.12, "learning_rate": 4.887675504441323e-06, "loss": 1.1055, "step": 4080 }, { "epoch": 0.12, "learning_rate": 4.887603200132901e-06, "loss": 1.0225, "step": 4081 }, { "epoch": 0.12, "learning_rate": 4.887530873095646e-06, "loss": 1.0971, "step": 4082 }, { "epoch": 0.12, "learning_rate": 4.887458523330248e-06, "loss": 1.1726, "step": 4083 }, { "epoch": 0.12, "learning_rate": 4.8873861508373945e-06, "loss": 1.1087, "step": 4084 }, { "epoch": 0.12, "learning_rate": 4.887313755617774e-06, "loss": 1.1464, "step": 4085 }, { "epoch": 0.12, "learning_rate": 4.887241337672077e-06, "loss": 1.1987, "step": 4086 }, { "epoch": 0.12, "learning_rate": 4.8871688970009924e-06, "loss": 1.1808, "step": 4087 }, { "epoch": 0.12, "learning_rate": 4.887096433605209e-06, "loss": 1.0967, "step": 4088 }, { "epoch": 0.12, "learning_rate": 4.887023947485417e-06, "loss": 1.2094, "step": 4089 }, { "epoch": 0.12, "learning_rate": 4.886951438642307e-06, "loss": 1.1417, "step": 4090 }, { "epoch": 0.12, "learning_rate": 4.886878907076569e-06, "loss": 1.063, "step": 4091 }, { "epoch": 0.12, "learning_rate": 4.886806352788893e-06, "loss": 1.1398, "step": 4092 }, { "epoch": 0.12, "learning_rate": 4.88673377577997e-06, "loss": 1.0142, "step": 4093 }, { "epoch": 0.12, "learning_rate": 4.886661176050492e-06, "loss": 1.1533, "step": 4094 }, { "epoch": 0.12, "learning_rate": 4.886588553601148e-06, "loss": 1.157, "step": 4095 }, { "epoch": 0.12, "learning_rate": 4.886515908432631e-06, "loss": 1.1589, "step": 4096 }, { "epoch": 0.12, "learning_rate": 4.886443240545632e-06, "loss": 1.1262, "step": 4097 }, { "epoch": 0.12, "learning_rate": 4.886370549940842e-06, "loss": 1.1053, "step": 4098 }, { "epoch": 0.12, "learning_rate": 4.8862978366189536e-06, "loss": 1.1027, "step": 4099 }, { "epoch": 0.12, "learning_rate": 4.8862251005806605e-06, "loss": 1.1138, "step": 4100 }, { "epoch": 0.12, "learning_rate": 4.886152341826652e-06, "loss": 1.0983, "step": 4101 }, { "epoch": 0.12, "learning_rate": 4.886079560357624e-06, "loss": 1.166, "step": 4102 }, { "epoch": 0.12, "learning_rate": 4.886006756174267e-06, "loss": 1.1745, "step": 4103 }, { "epoch": 0.12, "learning_rate": 4.885933929277274e-06, "loss": 1.1185, "step": 4104 }, { "epoch": 0.12, "learning_rate": 4.88586107966734e-06, "loss": 1.2009, "step": 4105 }, { "epoch": 0.12, "learning_rate": 4.8857882073451574e-06, "loss": 1.3395, "step": 4106 }, { "epoch": 0.12, "learning_rate": 4.8857153123114194e-06, "loss": 1.1311, "step": 4107 }, { "epoch": 0.12, "learning_rate": 4.885642394566822e-06, "loss": 1.1235, "step": 4108 }, { "epoch": 0.12, "learning_rate": 4.885569454112057e-06, "loss": 1.1445, "step": 4109 }, { "epoch": 0.12, "learning_rate": 4.88549649094782e-06, "loss": 1.1967, "step": 4110 }, { "epoch": 0.12, "learning_rate": 4.885423505074806e-06, "loss": 1.2544, "step": 4111 }, { "epoch": 0.12, "learning_rate": 4.885350496493708e-06, "loss": 1.2159, "step": 4112 }, { "epoch": 0.12, "learning_rate": 4.885277465205223e-06, "loss": 1.0955, "step": 4113 }, { "epoch": 0.12, "learning_rate": 4.885204411210045e-06, "loss": 1.1412, "step": 4114 }, { "epoch": 0.12, "learning_rate": 4.885131334508869e-06, "loss": 1.1579, "step": 4115 }, { "epoch": 0.12, "learning_rate": 4.885058235102392e-06, "loss": 1.037, "step": 4116 }, { "epoch": 0.12, "learning_rate": 4.88498511299131e-06, "loss": 1.1524, "step": 4117 }, { "epoch": 0.12, "learning_rate": 4.8849119681763165e-06, "loss": 1.1651, "step": 4118 }, { "epoch": 0.12, "learning_rate": 4.884838800658112e-06, "loss": 1.101, "step": 4119 }, { "epoch": 0.12, "learning_rate": 4.884765610437389e-06, "loss": 1.0972, "step": 4120 }, { "epoch": 0.12, "learning_rate": 4.884692397514846e-06, "loss": 1.2468, "step": 4121 }, { "epoch": 0.12, "learning_rate": 4.884619161891181e-06, "loss": 0.9786, "step": 4122 }, { "epoch": 0.12, "learning_rate": 4.884545903567089e-06, "loss": 1.1702, "step": 4123 }, { "epoch": 0.12, "learning_rate": 4.8844726225432696e-06, "loss": 1.2054, "step": 4124 }, { "epoch": 0.12, "learning_rate": 4.884399318820418e-06, "loss": 1.1476, "step": 4125 }, { "epoch": 0.12, "learning_rate": 4.884325992399234e-06, "loss": 1.055, "step": 4126 }, { "epoch": 0.12, "learning_rate": 4.884252643280415e-06, "loss": 1.0978, "step": 4127 }, { "epoch": 0.12, "learning_rate": 4.884179271464658e-06, "loss": 1.139, "step": 4128 }, { "epoch": 0.12, "learning_rate": 4.884105876952664e-06, "loss": 1.2654, "step": 4129 }, { "epoch": 0.12, "learning_rate": 4.884032459745129e-06, "loss": 1.0324, "step": 4130 }, { "epoch": 0.12, "learning_rate": 4.883959019842754e-06, "loss": 1.1758, "step": 4131 }, { "epoch": 0.12, "learning_rate": 4.8838855572462375e-06, "loss": 1.1523, "step": 4132 }, { "epoch": 0.12, "learning_rate": 4.883812071956277e-06, "loss": 1.2599, "step": 4133 }, { "epoch": 0.12, "learning_rate": 4.883738563973576e-06, "loss": 1.1021, "step": 4134 }, { "epoch": 0.12, "learning_rate": 4.88366503329883e-06, "loss": 1.0729, "step": 4135 }, { "epoch": 0.12, "learning_rate": 4.883591479932742e-06, "loss": 1.1916, "step": 4136 }, { "epoch": 0.12, "learning_rate": 4.883517903876011e-06, "loss": 1.336, "step": 4137 }, { "epoch": 0.12, "learning_rate": 4.883444305129337e-06, "loss": 1.1718, "step": 4138 }, { "epoch": 0.12, "learning_rate": 4.883370683693421e-06, "loss": 1.2034, "step": 4139 }, { "epoch": 0.12, "learning_rate": 4.883297039568965e-06, "loss": 1.1785, "step": 4140 }, { "epoch": 0.12, "learning_rate": 4.883223372756668e-06, "loss": 1.0688, "step": 4141 }, { "epoch": 0.12, "learning_rate": 4.883149683257233e-06, "loss": 1.2617, "step": 4142 }, { "epoch": 0.12, "learning_rate": 4.88307597107136e-06, "loss": 1.1309, "step": 4143 }, { "epoch": 0.12, "learning_rate": 4.883002236199752e-06, "loss": 1.2133, "step": 4144 }, { "epoch": 0.12, "learning_rate": 4.88292847864311e-06, "loss": 1.1431, "step": 4145 }, { "epoch": 0.12, "learning_rate": 4.8828546984021374e-06, "loss": 1.0678, "step": 4146 }, { "epoch": 0.12, "learning_rate": 4.882780895477535e-06, "loss": 0.9812, "step": 4147 }, { "epoch": 0.12, "learning_rate": 4.882707069870006e-06, "loss": 1.137, "step": 4148 }, { "epoch": 0.12, "learning_rate": 4.882633221580254e-06, "loss": 1.0907, "step": 4149 }, { "epoch": 0.13, "learning_rate": 4.88255935060898e-06, "loss": 1.3064, "step": 4150 }, { "epoch": 0.13, "learning_rate": 4.882485456956889e-06, "loss": 1.098, "step": 4151 }, { "epoch": 0.13, "learning_rate": 4.882411540624684e-06, "loss": 1.1996, "step": 4152 }, { "epoch": 0.13, "learning_rate": 4.882337601613069e-06, "loss": 1.2042, "step": 4153 }, { "epoch": 0.13, "learning_rate": 4.882263639922747e-06, "loss": 1.0997, "step": 4154 }, { "epoch": 0.13, "learning_rate": 4.882189655554423e-06, "loss": 1.2757, "step": 4155 }, { "epoch": 0.13, "learning_rate": 4.882115648508799e-06, "loss": 1.1718, "step": 4156 }, { "epoch": 0.13, "learning_rate": 4.882041618786584e-06, "loss": 1.1926, "step": 4157 }, { "epoch": 0.13, "learning_rate": 4.881967566388478e-06, "loss": 1.226, "step": 4158 }, { "epoch": 0.13, "learning_rate": 4.881893491315189e-06, "loss": 1.1592, "step": 4159 }, { "epoch": 0.13, "learning_rate": 4.8818193935674205e-06, "loss": 1.1634, "step": 4160 }, { "epoch": 0.13, "learning_rate": 4.881745273145878e-06, "loss": 1.2126, "step": 4161 }, { "epoch": 0.13, "learning_rate": 4.881671130051269e-06, "loss": 1.2307, "step": 4162 }, { "epoch": 0.13, "learning_rate": 4.881596964284296e-06, "loss": 1.1863, "step": 4163 }, { "epoch": 0.13, "learning_rate": 4.881522775845668e-06, "loss": 1.213, "step": 4164 }, { "epoch": 0.13, "learning_rate": 4.881448564736091e-06, "loss": 1.1617, "step": 4165 }, { "epoch": 0.13, "learning_rate": 4.88137433095627e-06, "loss": 1.1786, "step": 4166 }, { "epoch": 0.13, "learning_rate": 4.881300074506911e-06, "loss": 1.2489, "step": 4167 }, { "epoch": 0.13, "learning_rate": 4.881225795388724e-06, "loss": 1.3007, "step": 4168 }, { "epoch": 0.13, "learning_rate": 4.881151493602414e-06, "loss": 1.1987, "step": 4169 }, { "epoch": 0.13, "learning_rate": 4.881077169148688e-06, "loss": 1.1752, "step": 4170 }, { "epoch": 0.13, "learning_rate": 4.881002822028254e-06, "loss": 1.0709, "step": 4171 }, { "epoch": 0.13, "learning_rate": 4.88092845224182e-06, "loss": 1.1283, "step": 4172 }, { "epoch": 0.13, "learning_rate": 4.880854059790094e-06, "loss": 1.224, "step": 4173 }, { "epoch": 0.13, "learning_rate": 4.880779644673784e-06, "loss": 1.1805, "step": 4174 }, { "epoch": 0.13, "learning_rate": 4.880705206893599e-06, "loss": 1.1976, "step": 4175 }, { "epoch": 0.13, "learning_rate": 4.880630746450245e-06, "loss": 1.1667, "step": 4176 }, { "epoch": 0.13, "learning_rate": 4.880556263344435e-06, "loss": 1.1454, "step": 4177 }, { "epoch": 0.13, "learning_rate": 4.880481757576875e-06, "loss": 1.1029, "step": 4178 }, { "epoch": 0.13, "learning_rate": 4.880407229148275e-06, "loss": 1.1609, "step": 4179 }, { "epoch": 0.13, "learning_rate": 4.8803326780593455e-06, "loss": 1.1821, "step": 4180 }, { "epoch": 0.13, "learning_rate": 4.880258104310794e-06, "loss": 0.9508, "step": 4181 }, { "epoch": 0.13, "learning_rate": 4.8801835079033326e-06, "loss": 1.1859, "step": 4182 }, { "epoch": 0.13, "learning_rate": 4.88010888883767e-06, "loss": 1.2905, "step": 4183 }, { "epoch": 0.13, "learning_rate": 4.880034247114518e-06, "loss": 1.1789, "step": 4184 }, { "epoch": 0.13, "learning_rate": 4.879959582734586e-06, "loss": 1.1615, "step": 4185 }, { "epoch": 0.13, "learning_rate": 4.879884895698584e-06, "loss": 1.2493, "step": 4186 }, { "epoch": 0.13, "learning_rate": 4.879810186007224e-06, "loss": 1.2539, "step": 4187 }, { "epoch": 0.13, "learning_rate": 4.879735453661218e-06, "loss": 1.1249, "step": 4188 }, { "epoch": 0.13, "learning_rate": 4.879660698661277e-06, "loss": 1.1834, "step": 4189 }, { "epoch": 0.13, "learning_rate": 4.879585921008112e-06, "loss": 1.167, "step": 4190 }, { "epoch": 0.13, "learning_rate": 4.879511120702434e-06, "loss": 1.0361, "step": 4191 }, { "epoch": 0.13, "learning_rate": 4.879436297744957e-06, "loss": 1.1508, "step": 4192 }, { "epoch": 0.13, "learning_rate": 4.879361452136393e-06, "loss": 1.18, "step": 4193 }, { "epoch": 0.13, "learning_rate": 4.879286583877453e-06, "loss": 1.2233, "step": 4194 }, { "epoch": 0.13, "learning_rate": 4.87921169296885e-06, "loss": 1.147, "step": 4195 }, { "epoch": 0.13, "learning_rate": 4.879136779411299e-06, "loss": 1.0934, "step": 4196 }, { "epoch": 0.13, "learning_rate": 4.8790618432055116e-06, "loss": 1.1295, "step": 4197 }, { "epoch": 0.13, "learning_rate": 4.8789868843522e-06, "loss": 1.2505, "step": 4198 }, { "epoch": 0.13, "learning_rate": 4.87891190285208e-06, "loss": 1.1937, "step": 4199 }, { "epoch": 0.13, "learning_rate": 4.878836898705864e-06, "loss": 1.1852, "step": 4200 }, { "epoch": 0.13, "learning_rate": 4.878761871914266e-06, "loss": 1.2021, "step": 4201 }, { "epoch": 0.13, "learning_rate": 4.878686822478001e-06, "loss": 1.2222, "step": 4202 }, { "epoch": 0.13, "learning_rate": 4.8786117503977834e-06, "loss": 1.1656, "step": 4203 }, { "epoch": 0.13, "learning_rate": 4.878536655674328e-06, "loss": 1.0982, "step": 4204 }, { "epoch": 0.13, "learning_rate": 4.878461538308349e-06, "loss": 1.0957, "step": 4205 }, { "epoch": 0.13, "learning_rate": 4.878386398300561e-06, "loss": 1.2013, "step": 4206 }, { "epoch": 0.13, "learning_rate": 4.878311235651681e-06, "loss": 1.1295, "step": 4207 }, { "epoch": 0.13, "learning_rate": 4.878236050362422e-06, "loss": 1.2281, "step": 4208 }, { "epoch": 0.13, "learning_rate": 4.8781608424335015e-06, "loss": 1.1954, "step": 4209 }, { "epoch": 0.13, "learning_rate": 4.878085611865636e-06, "loss": 1.1828, "step": 4210 }, { "epoch": 0.13, "learning_rate": 4.87801035865954e-06, "loss": 1.2416, "step": 4211 }, { "epoch": 0.13, "learning_rate": 4.877935082815931e-06, "loss": 1.2924, "step": 4212 }, { "epoch": 0.13, "learning_rate": 4.877859784335524e-06, "loss": 1.1809, "step": 4213 }, { "epoch": 0.13, "learning_rate": 4.8777844632190395e-06, "loss": 1.2399, "step": 4214 }, { "epoch": 0.13, "learning_rate": 4.877709119467191e-06, "loss": 1.1171, "step": 4215 }, { "epoch": 0.13, "learning_rate": 4.8776337530806964e-06, "loss": 1.1984, "step": 4216 }, { "epoch": 0.13, "learning_rate": 4.877558364060274e-06, "loss": 1.2059, "step": 4217 }, { "epoch": 0.13, "learning_rate": 4.8774829524066405e-06, "loss": 1.0714, "step": 4218 }, { "epoch": 0.13, "learning_rate": 4.877407518120515e-06, "loss": 1.1762, "step": 4219 }, { "epoch": 0.13, "learning_rate": 4.8773320612026145e-06, "loss": 1.1685, "step": 4220 }, { "epoch": 0.13, "learning_rate": 4.8772565816536585e-06, "loss": 1.1329, "step": 4221 }, { "epoch": 0.13, "learning_rate": 4.877181079474363e-06, "loss": 1.0903, "step": 4222 }, { "epoch": 0.13, "learning_rate": 4.87710555466545e-06, "loss": 1.1302, "step": 4223 }, { "epoch": 0.13, "learning_rate": 4.877030007227637e-06, "loss": 1.2058, "step": 4224 }, { "epoch": 0.13, "learning_rate": 4.8769544371616425e-06, "loss": 1.312, "step": 4225 }, { "epoch": 0.13, "learning_rate": 4.876878844468188e-06, "loss": 1.1406, "step": 4226 }, { "epoch": 0.13, "learning_rate": 4.87680322914799e-06, "loss": 1.1631, "step": 4227 }, { "epoch": 0.13, "learning_rate": 4.87672759120177e-06, "loss": 1.2515, "step": 4228 }, { "epoch": 0.13, "learning_rate": 4.8766519306302486e-06, "loss": 1.1413, "step": 4229 }, { "epoch": 0.13, "learning_rate": 4.876576247434146e-06, "loss": 1.0261, "step": 4230 }, { "epoch": 0.13, "learning_rate": 4.876500541614181e-06, "loss": 1.2444, "step": 4231 }, { "epoch": 0.13, "learning_rate": 4.876424813171076e-06, "loss": 1.2223, "step": 4232 }, { "epoch": 0.13, "learning_rate": 4.876349062105551e-06, "loss": 1.2276, "step": 4233 }, { "epoch": 0.13, "learning_rate": 4.8762732884183274e-06, "loss": 1.0512, "step": 4234 }, { "epoch": 0.13, "learning_rate": 4.876197492110128e-06, "loss": 1.2161, "step": 4235 }, { "epoch": 0.13, "learning_rate": 4.876121673181671e-06, "loss": 1.2219, "step": 4236 }, { "epoch": 0.13, "learning_rate": 4.87604583163368e-06, "loss": 1.224, "step": 4237 }, { "epoch": 0.13, "learning_rate": 4.875969967466878e-06, "loss": 1.1592, "step": 4238 }, { "epoch": 0.13, "learning_rate": 4.875894080681986e-06, "loss": 1.1486, "step": 4239 }, { "epoch": 0.13, "learning_rate": 4.875818171279727e-06, "loss": 1.0609, "step": 4240 }, { "epoch": 0.13, "learning_rate": 4.875742239260822e-06, "loss": 1.0656, "step": 4241 }, { "epoch": 0.13, "learning_rate": 4.875666284625996e-06, "loss": 1.1224, "step": 4242 }, { "epoch": 0.13, "learning_rate": 4.875590307375972e-06, "loss": 1.2579, "step": 4243 }, { "epoch": 0.13, "learning_rate": 4.875514307511471e-06, "loss": 1.1915, "step": 4244 }, { "epoch": 0.13, "learning_rate": 4.875438285033218e-06, "loss": 1.1146, "step": 4245 }, { "epoch": 0.13, "learning_rate": 4.875362239941936e-06, "loss": 1.1901, "step": 4246 }, { "epoch": 0.13, "learning_rate": 4.875286172238351e-06, "loss": 1.1749, "step": 4247 }, { "epoch": 0.13, "learning_rate": 4.875210081923185e-06, "loss": 1.0933, "step": 4248 }, { "epoch": 0.13, "learning_rate": 4.8751339689971624e-06, "loss": 1.0839, "step": 4249 }, { "epoch": 0.13, "learning_rate": 4.875057833461009e-06, "loss": 1.1107, "step": 4250 }, { "epoch": 0.13, "learning_rate": 4.874981675315449e-06, "loss": 1.1796, "step": 4251 }, { "epoch": 0.13, "learning_rate": 4.874905494561207e-06, "loss": 1.1693, "step": 4252 }, { "epoch": 0.13, "learning_rate": 4.874829291199008e-06, "loss": 1.1711, "step": 4253 }, { "epoch": 0.13, "learning_rate": 4.874753065229579e-06, "loss": 1.1132, "step": 4254 }, { "epoch": 0.13, "learning_rate": 4.874676816653644e-06, "loss": 1.1769, "step": 4255 }, { "epoch": 0.13, "learning_rate": 4.874600545471929e-06, "loss": 1.0264, "step": 4256 }, { "epoch": 0.13, "learning_rate": 4.874524251685161e-06, "loss": 1.2208, "step": 4257 }, { "epoch": 0.13, "learning_rate": 4.8744479352940655e-06, "loss": 1.1143, "step": 4258 }, { "epoch": 0.13, "learning_rate": 4.8743715962993696e-06, "loss": 1.1293, "step": 4259 }, { "epoch": 0.13, "learning_rate": 4.874295234701799e-06, "loss": 1.1907, "step": 4260 }, { "epoch": 0.13, "learning_rate": 4.8742188505020816e-06, "loss": 1.2192, "step": 4261 }, { "epoch": 0.13, "learning_rate": 4.874142443700944e-06, "loss": 1.1507, "step": 4262 }, { "epoch": 0.13, "learning_rate": 4.874066014299114e-06, "loss": 1.1519, "step": 4263 }, { "epoch": 0.13, "learning_rate": 4.873989562297319e-06, "loss": 1.2247, "step": 4264 }, { "epoch": 0.13, "learning_rate": 4.873913087696286e-06, "loss": 1.1776, "step": 4265 }, { "epoch": 0.13, "learning_rate": 4.873836590496745e-06, "loss": 1.1535, "step": 4266 }, { "epoch": 0.13, "learning_rate": 4.873760070699421e-06, "loss": 1.0657, "step": 4267 }, { "epoch": 0.13, "learning_rate": 4.873683528305046e-06, "loss": 1.1834, "step": 4268 }, { "epoch": 0.13, "learning_rate": 4.873606963314347e-06, "loss": 1.188, "step": 4269 }, { "epoch": 0.13, "learning_rate": 4.8735303757280525e-06, "loss": 1.1547, "step": 4270 }, { "epoch": 0.13, "learning_rate": 4.873453765546892e-06, "loss": 1.1858, "step": 4271 }, { "epoch": 0.13, "learning_rate": 4.873377132771595e-06, "loss": 1.1565, "step": 4272 }, { "epoch": 0.13, "learning_rate": 4.87330047740289e-06, "loss": 1.222, "step": 4273 }, { "epoch": 0.13, "learning_rate": 4.873223799441508e-06, "loss": 1.0419, "step": 4274 }, { "epoch": 0.13, "learning_rate": 4.873147098888178e-06, "loss": 1.198, "step": 4275 }, { "epoch": 0.13, "learning_rate": 4.873070375743631e-06, "loss": 1.1814, "step": 4276 }, { "epoch": 0.13, "learning_rate": 4.872993630008597e-06, "loss": 1.1258, "step": 4277 }, { "epoch": 0.13, "learning_rate": 4.872916861683806e-06, "loss": 1.1057, "step": 4278 }, { "epoch": 0.13, "learning_rate": 4.872840070769989e-06, "loss": 1.2677, "step": 4279 }, { "epoch": 0.13, "learning_rate": 4.8727632572678794e-06, "loss": 1.2234, "step": 4280 }, { "epoch": 0.13, "learning_rate": 4.8726864211782044e-06, "loss": 1.3337, "step": 4281 }, { "epoch": 0.13, "learning_rate": 4.872609562501698e-06, "loss": 1.1034, "step": 4282 }, { "epoch": 0.13, "learning_rate": 4.872532681239092e-06, "loss": 1.2102, "step": 4283 }, { "epoch": 0.13, "learning_rate": 4.872455777391116e-06, "loss": 1.2267, "step": 4284 }, { "epoch": 0.13, "learning_rate": 4.8723788509585045e-06, "loss": 1.1737, "step": 4285 }, { "epoch": 0.13, "learning_rate": 4.872301901941988e-06, "loss": 1.3625, "step": 4286 }, { "epoch": 0.13, "learning_rate": 4.8722249303423006e-06, "loss": 1.241, "step": 4287 }, { "epoch": 0.13, "learning_rate": 4.872147936160175e-06, "loss": 1.1666, "step": 4288 }, { "epoch": 0.13, "learning_rate": 4.872070919396343e-06, "loss": 1.1943, "step": 4289 }, { "epoch": 0.13, "learning_rate": 4.8719938800515385e-06, "loss": 1.0807, "step": 4290 }, { "epoch": 0.13, "learning_rate": 4.871916818126494e-06, "loss": 1.2158, "step": 4291 }, { "epoch": 0.13, "learning_rate": 4.871839733621944e-06, "loss": 1.1457, "step": 4292 }, { "epoch": 0.13, "learning_rate": 4.871762626538623e-06, "loss": 1.1304, "step": 4293 }, { "epoch": 0.13, "learning_rate": 4.871685496877263e-06, "loss": 1.1853, "step": 4294 }, { "epoch": 0.13, "learning_rate": 4.871608344638599e-06, "loss": 1.1467, "step": 4295 }, { "epoch": 0.13, "learning_rate": 4.871531169823367e-06, "loss": 1.1384, "step": 4296 }, { "epoch": 0.13, "learning_rate": 4.8714539724322995e-06, "loss": 1.2599, "step": 4297 }, { "epoch": 0.13, "learning_rate": 4.871376752466132e-06, "loss": 1.2427, "step": 4298 }, { "epoch": 0.13, "learning_rate": 4.871299509925601e-06, "loss": 1.088, "step": 4299 }, { "epoch": 0.13, "learning_rate": 4.87122224481144e-06, "loss": 1.2693, "step": 4300 }, { "epoch": 0.13, "learning_rate": 4.871144957124385e-06, "loss": 1.1602, "step": 4301 }, { "epoch": 0.13, "learning_rate": 4.8710676468651726e-06, "loss": 1.1693, "step": 4302 }, { "epoch": 0.13, "learning_rate": 4.8709903140345385e-06, "loss": 1.1224, "step": 4303 }, { "epoch": 0.13, "learning_rate": 4.870912958633218e-06, "loss": 1.0977, "step": 4304 }, { "epoch": 0.13, "learning_rate": 4.870835580661948e-06, "loss": 1.2683, "step": 4305 }, { "epoch": 0.13, "learning_rate": 4.870758180121466e-06, "loss": 1.2826, "step": 4306 }, { "epoch": 0.13, "learning_rate": 4.870680757012506e-06, "loss": 1.1099, "step": 4307 }, { "epoch": 0.13, "learning_rate": 4.870603311335808e-06, "loss": 1.1731, "step": 4308 }, { "epoch": 0.13, "learning_rate": 4.870525843092109e-06, "loss": 1.1624, "step": 4309 }, { "epoch": 0.13, "learning_rate": 4.870448352282144e-06, "loss": 1.2244, "step": 4310 }, { "epoch": 0.13, "learning_rate": 4.870370838906653e-06, "loss": 1.1549, "step": 4311 }, { "epoch": 0.13, "learning_rate": 4.870293302966373e-06, "loss": 1.2011, "step": 4312 }, { "epoch": 0.13, "learning_rate": 4.870215744462044e-06, "loss": 1.0621, "step": 4313 }, { "epoch": 0.13, "learning_rate": 4.870138163394401e-06, "loss": 1.1668, "step": 4314 }, { "epoch": 0.13, "learning_rate": 4.870060559764185e-06, "loss": 1.1932, "step": 4315 }, { "epoch": 0.13, "learning_rate": 4.869982933572132e-06, "loss": 1.2689, "step": 4316 }, { "epoch": 0.13, "learning_rate": 4.869905284818985e-06, "loss": 1.1056, "step": 4317 }, { "epoch": 0.13, "learning_rate": 4.869827613505481e-06, "loss": 1.0836, "step": 4318 }, { "epoch": 0.13, "learning_rate": 4.869749919632359e-06, "loss": 1.1628, "step": 4319 }, { "epoch": 0.13, "learning_rate": 4.869672203200358e-06, "loss": 1.1539, "step": 4320 }, { "epoch": 0.13, "learning_rate": 4.869594464210221e-06, "loss": 1.1041, "step": 4321 }, { "epoch": 0.13, "learning_rate": 4.869516702662684e-06, "loss": 1.0934, "step": 4322 }, { "epoch": 0.13, "learning_rate": 4.869438918558491e-06, "loss": 1.1257, "step": 4323 }, { "epoch": 0.13, "learning_rate": 4.86936111189838e-06, "loss": 1.1075, "step": 4324 }, { "epoch": 0.13, "learning_rate": 4.869283282683092e-06, "loss": 1.1183, "step": 4325 }, { "epoch": 0.13, "learning_rate": 4.869205430913368e-06, "loss": 1.1434, "step": 4326 }, { "epoch": 0.13, "learning_rate": 4.869127556589949e-06, "loss": 1.0271, "step": 4327 }, { "epoch": 0.13, "learning_rate": 4.869049659713577e-06, "loss": 1.1265, "step": 4328 }, { "epoch": 0.13, "learning_rate": 4.868971740284994e-06, "loss": 1.0618, "step": 4329 }, { "epoch": 0.13, "learning_rate": 4.86889379830494e-06, "loss": 1.061, "step": 4330 }, { "epoch": 0.13, "learning_rate": 4.8688158337741585e-06, "loss": 1.2793, "step": 4331 }, { "epoch": 0.13, "learning_rate": 4.868737846693391e-06, "loss": 1.2338, "step": 4332 }, { "epoch": 0.13, "learning_rate": 4.8686598370633805e-06, "loss": 1.2059, "step": 4333 }, { "epoch": 0.13, "learning_rate": 4.868581804884869e-06, "loss": 1.0229, "step": 4334 }, { "epoch": 0.13, "learning_rate": 4.868503750158599e-06, "loss": 1.1354, "step": 4335 }, { "epoch": 0.13, "learning_rate": 4.868425672885314e-06, "loss": 1.1547, "step": 4336 }, { "epoch": 0.13, "learning_rate": 4.868347573065758e-06, "loss": 1.1093, "step": 4337 }, { "epoch": 0.13, "learning_rate": 4.868269450700673e-06, "loss": 1.1501, "step": 4338 }, { "epoch": 0.13, "learning_rate": 4.868191305790803e-06, "loss": 1.1541, "step": 4339 }, { "epoch": 0.13, "learning_rate": 4.868113138336893e-06, "loss": 1.1568, "step": 4340 }, { "epoch": 0.13, "learning_rate": 4.868034948339686e-06, "loss": 1.1688, "step": 4341 }, { "epoch": 0.13, "learning_rate": 4.867956735799928e-06, "loss": 1.169, "step": 4342 }, { "epoch": 0.13, "learning_rate": 4.867878500718362e-06, "loss": 1.1708, "step": 4343 }, { "epoch": 0.13, "learning_rate": 4.867800243095732e-06, "loss": 1.2352, "step": 4344 }, { "epoch": 0.13, "learning_rate": 4.867721962932785e-06, "loss": 1.2202, "step": 4345 }, { "epoch": 0.13, "learning_rate": 4.867643660230264e-06, "loss": 1.0713, "step": 4346 }, { "epoch": 0.13, "learning_rate": 4.8675653349889165e-06, "loss": 1.1041, "step": 4347 }, { "epoch": 0.13, "learning_rate": 4.867486987209487e-06, "loss": 1.2094, "step": 4348 }, { "epoch": 0.13, "learning_rate": 4.867408616892723e-06, "loss": 1.1517, "step": 4349 }, { "epoch": 0.13, "learning_rate": 4.867330224039367e-06, "loss": 1.2734, "step": 4350 }, { "epoch": 0.13, "learning_rate": 4.867251808650169e-06, "loss": 1.171, "step": 4351 }, { "epoch": 0.13, "learning_rate": 4.867173370725873e-06, "loss": 1.1459, "step": 4352 }, { "epoch": 0.13, "learning_rate": 4.867094910267227e-06, "loss": 1.0267, "step": 4353 }, { "epoch": 0.13, "learning_rate": 4.867016427274978e-06, "loss": 1.1841, "step": 4354 }, { "epoch": 0.13, "learning_rate": 4.866937921749871e-06, "loss": 1.2458, "step": 4355 }, { "epoch": 0.13, "learning_rate": 4.8668593936926564e-06, "loss": 1.2236, "step": 4356 }, { "epoch": 0.13, "learning_rate": 4.86678084310408e-06, "loss": 1.1877, "step": 4357 }, { "epoch": 0.13, "learning_rate": 4.86670226998489e-06, "loss": 1.1205, "step": 4358 }, { "epoch": 0.13, "learning_rate": 4.8666236743358336e-06, "loss": 1.1273, "step": 4359 }, { "epoch": 0.13, "learning_rate": 4.86654505615766e-06, "loss": 1.188, "step": 4360 }, { "epoch": 0.13, "learning_rate": 4.866466415451117e-06, "loss": 1.1445, "step": 4361 }, { "epoch": 0.13, "learning_rate": 4.866387752216953e-06, "loss": 1.0806, "step": 4362 }, { "epoch": 0.13, "learning_rate": 4.866309066455919e-06, "loss": 1.1771, "step": 4363 }, { "epoch": 0.13, "learning_rate": 4.866230358168761e-06, "loss": 1.2717, "step": 4364 }, { "epoch": 0.13, "learning_rate": 4.86615162735623e-06, "loss": 1.0381, "step": 4365 }, { "epoch": 0.13, "learning_rate": 4.866072874019075e-06, "loss": 1.2195, "step": 4366 }, { "epoch": 0.13, "learning_rate": 4.865994098158045e-06, "loss": 1.3088, "step": 4367 }, { "epoch": 0.13, "learning_rate": 4.8659152997738925e-06, "loss": 1.2476, "step": 4368 }, { "epoch": 0.13, "learning_rate": 4.865836478867364e-06, "loss": 1.0562, "step": 4369 }, { "epoch": 0.13, "learning_rate": 4.865757635439212e-06, "loss": 1.1572, "step": 4370 }, { "epoch": 0.13, "learning_rate": 4.8656787694901875e-06, "loss": 1.1261, "step": 4371 }, { "epoch": 0.13, "learning_rate": 4.865599881021041e-06, "loss": 1.1317, "step": 4372 }, { "epoch": 0.13, "learning_rate": 4.865520970032521e-06, "loss": 1.2618, "step": 4373 }, { "epoch": 0.13, "learning_rate": 4.865442036525382e-06, "loss": 1.1238, "step": 4374 }, { "epoch": 0.13, "learning_rate": 4.865363080500374e-06, "loss": 1.2998, "step": 4375 }, { "epoch": 0.13, "learning_rate": 4.865284101958247e-06, "loss": 1.1365, "step": 4376 }, { "epoch": 0.13, "learning_rate": 4.865205100899757e-06, "loss": 1.2214, "step": 4377 }, { "epoch": 0.13, "learning_rate": 4.865126077325653e-06, "loss": 1.1031, "step": 4378 }, { "epoch": 0.13, "learning_rate": 4.8650470312366865e-06, "loss": 1.1521, "step": 4379 }, { "epoch": 0.13, "learning_rate": 4.8649679626336125e-06, "loss": 1.2234, "step": 4380 }, { "epoch": 0.13, "learning_rate": 4.864888871517182e-06, "loss": 1.1211, "step": 4381 }, { "epoch": 0.13, "learning_rate": 4.864809757888148e-06, "loss": 1.2388, "step": 4382 }, { "epoch": 0.13, "learning_rate": 4.8647306217472645e-06, "loss": 1.2335, "step": 4383 }, { "epoch": 0.13, "learning_rate": 4.8646514630952844e-06, "loss": 1.1469, "step": 4384 }, { "epoch": 0.13, "learning_rate": 4.864572281932961e-06, "loss": 1.1099, "step": 4385 }, { "epoch": 0.13, "learning_rate": 4.864493078261049e-06, "loss": 1.1835, "step": 4386 }, { "epoch": 0.13, "learning_rate": 4.864413852080301e-06, "loss": 1.2098, "step": 4387 }, { "epoch": 0.13, "learning_rate": 4.864334603391472e-06, "loss": 1.1459, "step": 4388 }, { "epoch": 0.13, "learning_rate": 4.864255332195316e-06, "loss": 1.1667, "step": 4389 }, { "epoch": 0.13, "learning_rate": 4.864176038492588e-06, "loss": 1.1063, "step": 4390 }, { "epoch": 0.13, "learning_rate": 4.8640967222840435e-06, "loss": 1.0739, "step": 4391 }, { "epoch": 0.13, "learning_rate": 4.8640173835704364e-06, "loss": 1.1476, "step": 4392 }, { "epoch": 0.13, "learning_rate": 4.863938022352523e-06, "loss": 1.0921, "step": 4393 }, { "epoch": 0.13, "learning_rate": 4.863858638631057e-06, "loss": 1.1912, "step": 4394 }, { "epoch": 0.13, "learning_rate": 4.863779232406795e-06, "loss": 1.0609, "step": 4395 }, { "epoch": 0.13, "learning_rate": 4.8636998036804935e-06, "loss": 1.1083, "step": 4396 }, { "epoch": 0.13, "learning_rate": 4.863620352452909e-06, "loss": 1.0875, "step": 4397 }, { "epoch": 0.13, "learning_rate": 4.863540878724796e-06, "loss": 1.1307, "step": 4398 }, { "epoch": 0.13, "learning_rate": 4.8634613824969136e-06, "loss": 1.1304, "step": 4399 }, { "epoch": 0.13, "learning_rate": 4.8633818637700155e-06, "loss": 1.3147, "step": 4400 }, { "epoch": 0.13, "learning_rate": 4.863302322544862e-06, "loss": 1.158, "step": 4401 }, { "epoch": 0.13, "learning_rate": 4.863222758822207e-06, "loss": 1.1403, "step": 4402 }, { "epoch": 0.13, "learning_rate": 4.86314317260281e-06, "loss": 1.1918, "step": 4403 }, { "epoch": 0.13, "learning_rate": 4.863063563887428e-06, "loss": 1.1551, "step": 4404 }, { "epoch": 0.13, "learning_rate": 4.8629839326768196e-06, "loss": 1.2122, "step": 4405 }, { "epoch": 0.13, "learning_rate": 4.862904278971742e-06, "loss": 1.1533, "step": 4406 }, { "epoch": 0.13, "learning_rate": 4.8628246027729535e-06, "loss": 1.1146, "step": 4407 }, { "epoch": 0.13, "learning_rate": 4.862744904081213e-06, "loss": 1.1183, "step": 4408 }, { "epoch": 0.13, "learning_rate": 4.862665182897279e-06, "loss": 1.0953, "step": 4409 }, { "epoch": 0.13, "learning_rate": 4.86258543922191e-06, "loss": 1.0938, "step": 4410 }, { "epoch": 0.13, "learning_rate": 4.862505673055865e-06, "loss": 1.0783, "step": 4411 }, { "epoch": 0.13, "learning_rate": 4.862425884399905e-06, "loss": 1.1389, "step": 4412 }, { "epoch": 0.13, "learning_rate": 4.862346073254788e-06, "loss": 1.0842, "step": 4413 }, { "epoch": 0.13, "learning_rate": 4.862266239621274e-06, "loss": 1.1564, "step": 4414 }, { "epoch": 0.13, "learning_rate": 4.862186383500123e-06, "loss": 1.1534, "step": 4415 }, { "epoch": 0.13, "learning_rate": 4.8621065048920946e-06, "loss": 1.0572, "step": 4416 }, { "epoch": 0.13, "learning_rate": 4.862026603797951e-06, "loss": 1.1417, "step": 4417 }, { "epoch": 0.13, "learning_rate": 4.861946680218451e-06, "loss": 1.2007, "step": 4418 }, { "epoch": 0.13, "learning_rate": 4.861866734154357e-06, "loss": 1.0721, "step": 4419 }, { "epoch": 0.13, "learning_rate": 4.861786765606428e-06, "loss": 1.1708, "step": 4420 }, { "epoch": 0.13, "learning_rate": 4.861706774575427e-06, "loss": 1.2415, "step": 4421 }, { "epoch": 0.13, "learning_rate": 4.861626761062116e-06, "loss": 1.2106, "step": 4422 }, { "epoch": 0.13, "learning_rate": 4.861546725067254e-06, "loss": 1.1274, "step": 4423 }, { "epoch": 0.13, "learning_rate": 4.861466666591606e-06, "loss": 1.2128, "step": 4424 }, { "epoch": 0.13, "learning_rate": 4.861386585635932e-06, "loss": 1.0771, "step": 4425 }, { "epoch": 0.13, "learning_rate": 4.861306482200995e-06, "loss": 1.2227, "step": 4426 }, { "epoch": 0.13, "learning_rate": 4.861226356287557e-06, "loss": 1.23, "step": 4427 }, { "epoch": 0.13, "learning_rate": 4.8611462078963814e-06, "loss": 1.1675, "step": 4428 }, { "epoch": 0.13, "learning_rate": 4.861066037028231e-06, "loss": 1.1146, "step": 4429 }, { "epoch": 0.13, "learning_rate": 4.86098584368387e-06, "loss": 1.2224, "step": 4430 }, { "epoch": 0.13, "learning_rate": 4.8609056278640605e-06, "loss": 1.1702, "step": 4431 }, { "epoch": 0.13, "learning_rate": 4.860825389569566e-06, "loss": 1.1829, "step": 4432 }, { "epoch": 0.13, "learning_rate": 4.860745128801152e-06, "loss": 1.1731, "step": 4433 }, { "epoch": 0.13, "learning_rate": 4.86066484555958e-06, "loss": 1.1046, "step": 4434 }, { "epoch": 0.13, "learning_rate": 4.8605845398456155e-06, "loss": 1.2226, "step": 4435 }, { "epoch": 0.13, "learning_rate": 4.860504211660025e-06, "loss": 1.1555, "step": 4436 }, { "epoch": 0.13, "learning_rate": 4.8604238610035695e-06, "loss": 1.1956, "step": 4437 }, { "epoch": 0.13, "learning_rate": 4.860343487877016e-06, "loss": 1.1645, "step": 4438 }, { "epoch": 0.13, "learning_rate": 4.860263092281129e-06, "loss": 1.0587, "step": 4439 }, { "epoch": 0.13, "learning_rate": 4.8601826742166745e-06, "loss": 1.0851, "step": 4440 }, { "epoch": 0.13, "learning_rate": 4.860102233684417e-06, "loss": 1.2218, "step": 4441 }, { "epoch": 0.13, "learning_rate": 4.8600217706851235e-06, "loss": 1.215, "step": 4442 }, { "epoch": 0.13, "learning_rate": 4.859941285219559e-06, "loss": 1.1956, "step": 4443 }, { "epoch": 0.13, "learning_rate": 4.859860777288491e-06, "loss": 1.1282, "step": 4444 }, { "epoch": 0.13, "learning_rate": 4.859780246892685e-06, "loss": 1.1178, "step": 4445 }, { "epoch": 0.13, "learning_rate": 4.8596996940329066e-06, "loss": 1.2142, "step": 4446 }, { "epoch": 0.13, "learning_rate": 4.859619118709924e-06, "loss": 1.2581, "step": 4447 }, { "epoch": 0.13, "learning_rate": 4.859538520924503e-06, "loss": 1.1049, "step": 4448 }, { "epoch": 0.13, "learning_rate": 4.859457900677413e-06, "loss": 1.0324, "step": 4449 }, { "epoch": 0.13, "learning_rate": 4.8593772579694195e-06, "loss": 1.1653, "step": 4450 }, { "epoch": 0.13, "learning_rate": 4.85929659280129e-06, "loss": 1.1837, "step": 4451 }, { "epoch": 0.13, "learning_rate": 4.859215905173795e-06, "loss": 1.094, "step": 4452 }, { "epoch": 0.13, "learning_rate": 4.8591351950877e-06, "loss": 1.0591, "step": 4453 }, { "epoch": 0.13, "learning_rate": 4.859054462543774e-06, "loss": 1.1578, "step": 4454 }, { "epoch": 0.13, "learning_rate": 4.8589737075427855e-06, "loss": 1.2335, "step": 4455 }, { "epoch": 0.13, "learning_rate": 4.8588929300855035e-06, "loss": 1.0969, "step": 4456 }, { "epoch": 0.13, "learning_rate": 4.858812130172697e-06, "loss": 1.2515, "step": 4457 }, { "epoch": 0.13, "learning_rate": 4.858731307805135e-06, "loss": 1.1943, "step": 4458 }, { "epoch": 0.13, "learning_rate": 4.858650462983587e-06, "loss": 1.1165, "step": 4459 }, { "epoch": 0.13, "learning_rate": 4.858569595708823e-06, "loss": 1.015, "step": 4460 }, { "epoch": 0.13, "learning_rate": 4.858488705981611e-06, "loss": 1.1122, "step": 4461 }, { "epoch": 0.13, "learning_rate": 4.858407793802724e-06, "loss": 1.3078, "step": 4462 }, { "epoch": 0.13, "learning_rate": 4.85832685917293e-06, "loss": 1.1641, "step": 4463 }, { "epoch": 0.13, "learning_rate": 4.858245902093e-06, "loss": 1.2344, "step": 4464 }, { "epoch": 0.13, "learning_rate": 4.8581649225637055e-06, "loss": 1.1028, "step": 4465 }, { "epoch": 0.13, "learning_rate": 4.858083920585816e-06, "loss": 1.1988, "step": 4466 }, { "epoch": 0.13, "learning_rate": 4.858002896160103e-06, "loss": 1.2279, "step": 4467 }, { "epoch": 0.13, "learning_rate": 4.857921849287338e-06, "loss": 1.2271, "step": 4468 }, { "epoch": 0.13, "learning_rate": 4.8578407799682935e-06, "loss": 1.179, "step": 4469 }, { "epoch": 0.13, "learning_rate": 4.85775968820374e-06, "loss": 1.103, "step": 4470 }, { "epoch": 0.13, "learning_rate": 4.85767857399445e-06, "loss": 1.1883, "step": 4471 }, { "epoch": 0.13, "learning_rate": 4.857597437341195e-06, "loss": 1.0715, "step": 4472 }, { "epoch": 0.13, "learning_rate": 4.857516278244748e-06, "loss": 1.0488, "step": 4473 }, { "epoch": 0.13, "learning_rate": 4.857435096705881e-06, "loss": 1.249, "step": 4474 }, { "epoch": 0.13, "learning_rate": 4.857353892725368e-06, "loss": 1.2477, "step": 4475 }, { "epoch": 0.13, "learning_rate": 4.8572726663039804e-06, "loss": 1.1991, "step": 4476 }, { "epoch": 0.13, "learning_rate": 4.857191417442493e-06, "loss": 1.0495, "step": 4477 }, { "epoch": 0.13, "learning_rate": 4.85711014614168e-06, "loss": 1.1307, "step": 4478 }, { "epoch": 0.13, "learning_rate": 4.857028852402311e-06, "loss": 1.1925, "step": 4479 }, { "epoch": 0.13, "learning_rate": 4.856947536225164e-06, "loss": 1.193, "step": 4480 }, { "epoch": 0.13, "learning_rate": 4.856866197611011e-06, "loss": 1.14, "step": 4481 }, { "epoch": 0.14, "learning_rate": 4.856784836560628e-06, "loss": 1.1475, "step": 4482 }, { "epoch": 0.14, "learning_rate": 4.856703453074787e-06, "loss": 1.2462, "step": 4483 }, { "epoch": 0.14, "learning_rate": 4.8566220471542644e-06, "loss": 1.1172, "step": 4484 }, { "epoch": 0.14, "learning_rate": 4.856540618799835e-06, "loss": 1.1169, "step": 4485 }, { "epoch": 0.14, "learning_rate": 4.8564591680122745e-06, "loss": 1.0383, "step": 4486 }, { "epoch": 0.14, "learning_rate": 4.8563776947923565e-06, "loss": 1.1865, "step": 4487 }, { "epoch": 0.14, "learning_rate": 4.856296199140859e-06, "loss": 1.1556, "step": 4488 }, { "epoch": 0.14, "learning_rate": 4.856214681058555e-06, "loss": 1.0911, "step": 4489 }, { "epoch": 0.14, "learning_rate": 4.856133140546224e-06, "loss": 1.1274, "step": 4490 }, { "epoch": 0.14, "learning_rate": 4.856051577604639e-06, "loss": 1.2029, "step": 4491 }, { "epoch": 0.14, "learning_rate": 4.855969992234578e-06, "loss": 1.1223, "step": 4492 }, { "epoch": 0.14, "learning_rate": 4.855888384436817e-06, "loss": 1.2188, "step": 4493 }, { "epoch": 0.14, "learning_rate": 4.855806754212133e-06, "loss": 1.0975, "step": 4494 }, { "epoch": 0.14, "learning_rate": 4.8557251015613044e-06, "loss": 1.1149, "step": 4495 }, { "epoch": 0.14, "learning_rate": 4.855643426485106e-06, "loss": 1.2118, "step": 4496 }, { "epoch": 0.14, "learning_rate": 4.855561728984318e-06, "loss": 1.1785, "step": 4497 }, { "epoch": 0.14, "learning_rate": 4.855480009059717e-06, "loss": 1.167, "step": 4498 }, { "epoch": 0.14, "learning_rate": 4.855398266712079e-06, "loss": 1.2798, "step": 4499 }, { "epoch": 0.14, "learning_rate": 4.855316501942186e-06, "loss": 1.0911, "step": 4500 }, { "epoch": 0.14, "learning_rate": 4.855234714750813e-06, "loss": 1.2394, "step": 4501 }, { "epoch": 0.14, "learning_rate": 4.85515290513874e-06, "loss": 1.1573, "step": 4502 }, { "epoch": 0.14, "learning_rate": 4.8550710731067455e-06, "loss": 1.1541, "step": 4503 }, { "epoch": 0.14, "learning_rate": 4.854989218655608e-06, "loss": 1.0721, "step": 4504 }, { "epoch": 0.14, "learning_rate": 4.8549073417861086e-06, "loss": 1.0446, "step": 4505 }, { "epoch": 0.14, "learning_rate": 4.854825442499025e-06, "loss": 1.1684, "step": 4506 }, { "epoch": 0.14, "learning_rate": 4.8547435207951375e-06, "loss": 1.0671, "step": 4507 }, { "epoch": 0.14, "learning_rate": 4.854661576675226e-06, "loss": 1.1356, "step": 4508 }, { "epoch": 0.14, "learning_rate": 4.854579610140069e-06, "loss": 1.1547, "step": 4509 }, { "epoch": 0.14, "learning_rate": 4.854497621190449e-06, "loss": 1.2061, "step": 4510 }, { "epoch": 0.14, "learning_rate": 4.854415609827145e-06, "loss": 1.2162, "step": 4511 }, { "epoch": 0.14, "learning_rate": 4.854333576050941e-06, "loss": 1.2155, "step": 4512 }, { "epoch": 0.14, "learning_rate": 4.854251519862612e-06, "loss": 1.1639, "step": 4513 }, { "epoch": 0.14, "learning_rate": 4.854169441262944e-06, "loss": 1.1675, "step": 4514 }, { "epoch": 0.14, "learning_rate": 4.854087340252716e-06, "loss": 1.1663, "step": 4515 }, { "epoch": 0.14, "learning_rate": 4.85400521683271e-06, "loss": 1.17, "step": 4516 }, { "epoch": 0.14, "learning_rate": 4.853923071003709e-06, "loss": 1.1302, "step": 4517 }, { "epoch": 0.14, "learning_rate": 4.853840902766493e-06, "loss": 1.1697, "step": 4518 }, { "epoch": 0.14, "learning_rate": 4.853758712121847e-06, "loss": 1.1408, "step": 4519 }, { "epoch": 0.14, "learning_rate": 4.85367649907055e-06, "loss": 1.1485, "step": 4520 }, { "epoch": 0.14, "learning_rate": 4.853594263613387e-06, "loss": 1.1588, "step": 4521 }, { "epoch": 0.14, "learning_rate": 4.85351200575114e-06, "loss": 1.16, "step": 4522 }, { "epoch": 0.14, "learning_rate": 4.853429725484593e-06, "loss": 1.14, "step": 4523 }, { "epoch": 0.14, "learning_rate": 4.853347422814527e-06, "loss": 1.2196, "step": 4524 }, { "epoch": 0.14, "learning_rate": 4.853265097741728e-06, "loss": 1.269, "step": 4525 }, { "epoch": 0.14, "learning_rate": 4.853182750266978e-06, "loss": 1.2081, "step": 4526 }, { "epoch": 0.14, "learning_rate": 4.853100380391062e-06, "loss": 1.059, "step": 4527 }, { "epoch": 0.14, "learning_rate": 4.853017988114763e-06, "loss": 1.0627, "step": 4528 }, { "epoch": 0.14, "learning_rate": 4.852935573438867e-06, "loss": 1.1443, "step": 4529 }, { "epoch": 0.14, "learning_rate": 4.852853136364157e-06, "loss": 1.1971, "step": 4530 }, { "epoch": 0.14, "learning_rate": 4.852770676891419e-06, "loss": 1.2297, "step": 4531 }, { "epoch": 0.14, "learning_rate": 4.8526881950214365e-06, "loss": 1.1468, "step": 4532 }, { "epoch": 0.14, "learning_rate": 4.852605690754996e-06, "loss": 1.1337, "step": 4533 }, { "epoch": 0.14, "learning_rate": 4.852523164092882e-06, "loss": 1.0554, "step": 4534 }, { "epoch": 0.14, "learning_rate": 4.85244061503588e-06, "loss": 1.1623, "step": 4535 }, { "epoch": 0.14, "learning_rate": 4.852358043584777e-06, "loss": 1.1996, "step": 4536 }, { "epoch": 0.14, "learning_rate": 4.852275449740358e-06, "loss": 1.0795, "step": 4537 }, { "epoch": 0.14, "learning_rate": 4.85219283350341e-06, "loss": 1.0931, "step": 4538 }, { "epoch": 0.14, "learning_rate": 4.852110194874718e-06, "loss": 1.2065, "step": 4539 }, { "epoch": 0.14, "learning_rate": 4.852027533855071e-06, "loss": 1.1219, "step": 4540 }, { "epoch": 0.14, "learning_rate": 4.851944850445255e-06, "loss": 1.0545, "step": 4541 }, { "epoch": 0.14, "learning_rate": 4.851862144646056e-06, "loss": 1.117, "step": 4542 }, { "epoch": 0.14, "learning_rate": 4.851779416458262e-06, "loss": 1.1876, "step": 4543 }, { "epoch": 0.14, "learning_rate": 4.8516966658826606e-06, "loss": 1.1403, "step": 4544 }, { "epoch": 0.14, "learning_rate": 4.85161389292004e-06, "loss": 1.1381, "step": 4545 }, { "epoch": 0.14, "learning_rate": 4.851531097571187e-06, "loss": 1.0685, "step": 4546 }, { "epoch": 0.14, "learning_rate": 4.851448279836891e-06, "loss": 1.0857, "step": 4547 }, { "epoch": 0.14, "learning_rate": 4.8513654397179396e-06, "loss": 1.1257, "step": 4548 }, { "epoch": 0.14, "learning_rate": 4.851282577215122e-06, "loss": 1.1656, "step": 4549 }, { "epoch": 0.14, "learning_rate": 4.851199692329227e-06, "loss": 1.1296, "step": 4550 }, { "epoch": 0.14, "learning_rate": 4.8511167850610425e-06, "loss": 1.1892, "step": 4551 }, { "epoch": 0.14, "learning_rate": 4.851033855411359e-06, "loss": 1.1102, "step": 4552 }, { "epoch": 0.14, "learning_rate": 4.850950903380965e-06, "loss": 1.2155, "step": 4553 }, { "epoch": 0.14, "learning_rate": 4.850867928970651e-06, "loss": 1.1611, "step": 4554 }, { "epoch": 0.14, "learning_rate": 4.850784932181207e-06, "loss": 1.1148, "step": 4555 }, { "epoch": 0.14, "learning_rate": 4.850701913013422e-06, "loss": 1.2123, "step": 4556 }, { "epoch": 0.14, "learning_rate": 4.850618871468087e-06, "loss": 1.1778, "step": 4557 }, { "epoch": 0.14, "learning_rate": 4.850535807545993e-06, "loss": 1.1731, "step": 4558 }, { "epoch": 0.14, "learning_rate": 4.850452721247929e-06, "loss": 1.1116, "step": 4559 }, { "epoch": 0.14, "learning_rate": 4.850369612574688e-06, "loss": 1.1765, "step": 4560 }, { "epoch": 0.14, "learning_rate": 4.85028648152706e-06, "loss": 1.2401, "step": 4561 }, { "epoch": 0.14, "learning_rate": 4.850203328105837e-06, "loss": 1.1722, "step": 4562 }, { "epoch": 0.14, "learning_rate": 4.85012015231181e-06, "loss": 1.1832, "step": 4563 }, { "epoch": 0.14, "learning_rate": 4.850036954145771e-06, "loss": 1.049, "step": 4564 }, { "epoch": 0.14, "learning_rate": 4.849953733608513e-06, "loss": 1.1373, "step": 4565 }, { "epoch": 0.14, "learning_rate": 4.849870490700825e-06, "loss": 1.1456, "step": 4566 }, { "epoch": 0.14, "learning_rate": 4.849787225423503e-06, "loss": 1.1874, "step": 4567 }, { "epoch": 0.14, "learning_rate": 4.849703937777338e-06, "loss": 1.1349, "step": 4568 }, { "epoch": 0.14, "learning_rate": 4.849620627763124e-06, "loss": 1.0482, "step": 4569 }, { "epoch": 0.14, "learning_rate": 4.849537295381652e-06, "loss": 1.1722, "step": 4570 }, { "epoch": 0.14, "learning_rate": 4.849453940633717e-06, "loss": 1.1907, "step": 4571 }, { "epoch": 0.14, "learning_rate": 4.849370563520113e-06, "loss": 1.0673, "step": 4572 }, { "epoch": 0.14, "learning_rate": 4.849287164041632e-06, "loss": 1.0638, "step": 4573 }, { "epoch": 0.14, "learning_rate": 4.8492037421990675e-06, "loss": 1.1, "step": 4574 }, { "epoch": 0.14, "learning_rate": 4.8491202979932166e-06, "loss": 1.1943, "step": 4575 }, { "epoch": 0.14, "learning_rate": 4.84903683142487e-06, "loss": 1.1882, "step": 4576 }, { "epoch": 0.14, "learning_rate": 4.848953342494826e-06, "loss": 1.1903, "step": 4577 }, { "epoch": 0.14, "learning_rate": 4.848869831203876e-06, "loss": 1.1727, "step": 4578 }, { "epoch": 0.14, "learning_rate": 4.8487862975528175e-06, "loss": 1.1646, "step": 4579 }, { "epoch": 0.14, "learning_rate": 4.8487027415424445e-06, "loss": 1.2112, "step": 4580 }, { "epoch": 0.14, "learning_rate": 4.848619163173553e-06, "loss": 1.2888, "step": 4581 }, { "epoch": 0.14, "learning_rate": 4.848535562446936e-06, "loss": 1.0527, "step": 4582 }, { "epoch": 0.14, "learning_rate": 4.848451939363394e-06, "loss": 1.2606, "step": 4583 }, { "epoch": 0.14, "learning_rate": 4.848368293923719e-06, "loss": 1.1068, "step": 4584 }, { "epoch": 0.14, "learning_rate": 4.84828462612871e-06, "loss": 1.0586, "step": 4585 }, { "epoch": 0.14, "learning_rate": 4.848200935979162e-06, "loss": 1.0558, "step": 4586 }, { "epoch": 0.14, "learning_rate": 4.848117223475871e-06, "loss": 1.2033, "step": 4587 }, { "epoch": 0.14, "learning_rate": 4.848033488619636e-06, "loss": 1.1409, "step": 4588 }, { "epoch": 0.14, "learning_rate": 4.847949731411253e-06, "loss": 1.1364, "step": 4589 }, { "epoch": 0.14, "learning_rate": 4.847865951851519e-06, "loss": 1.1799, "step": 4590 }, { "epoch": 0.14, "learning_rate": 4.847782149941232e-06, "loss": 1.0159, "step": 4591 }, { "epoch": 0.14, "learning_rate": 4.847698325681191e-06, "loss": 1.0638, "step": 4592 }, { "epoch": 0.14, "learning_rate": 4.847614479072191e-06, "loss": 1.2903, "step": 4593 }, { "epoch": 0.14, "learning_rate": 4.847530610115032e-06, "loss": 1.2347, "step": 4594 }, { "epoch": 0.14, "learning_rate": 4.847446718810512e-06, "loss": 1.2391, "step": 4595 }, { "epoch": 0.14, "learning_rate": 4.84736280515943e-06, "loss": 1.2117, "step": 4596 }, { "epoch": 0.14, "learning_rate": 4.847278869162585e-06, "loss": 1.109, "step": 4597 }, { "epoch": 0.14, "learning_rate": 4.847194910820775e-06, "loss": 1.1164, "step": 4598 }, { "epoch": 0.14, "learning_rate": 4.8471109301348e-06, "loss": 0.9863, "step": 4599 }, { "epoch": 0.14, "learning_rate": 4.84702692710546e-06, "loss": 1.1232, "step": 4600 }, { "epoch": 0.14, "learning_rate": 4.846942901733555e-06, "loss": 1.1487, "step": 4601 }, { "epoch": 0.14, "learning_rate": 4.8468588540198826e-06, "loss": 1.0565, "step": 4602 }, { "epoch": 0.14, "learning_rate": 4.846774783965244e-06, "loss": 1.0584, "step": 4603 }, { "epoch": 0.14, "learning_rate": 4.84669069157044e-06, "loss": 1.1221, "step": 4604 }, { "epoch": 0.14, "learning_rate": 4.84660657683627e-06, "loss": 1.1705, "step": 4605 }, { "epoch": 0.14, "learning_rate": 4.8465224397635365e-06, "loss": 1.2094, "step": 4606 }, { "epoch": 0.14, "learning_rate": 4.84643828035304e-06, "loss": 1.1038, "step": 4607 }, { "epoch": 0.14, "learning_rate": 4.84635409860558e-06, "loss": 1.1515, "step": 4608 }, { "epoch": 0.14, "learning_rate": 4.84626989452196e-06, "loss": 1.0474, "step": 4609 }, { "epoch": 0.14, "learning_rate": 4.846185668102979e-06, "loss": 1.1813, "step": 4610 }, { "epoch": 0.14, "learning_rate": 4.846101419349443e-06, "loss": 1.078, "step": 4611 }, { "epoch": 0.14, "learning_rate": 4.84601714826215e-06, "loss": 1.3174, "step": 4612 }, { "epoch": 0.14, "learning_rate": 4.845932854841903e-06, "loss": 1.015, "step": 4613 }, { "epoch": 0.14, "learning_rate": 4.845848539089505e-06, "loss": 1.1253, "step": 4614 }, { "epoch": 0.14, "learning_rate": 4.845764201005759e-06, "loss": 1.1002, "step": 4615 }, { "epoch": 0.14, "learning_rate": 4.8456798405914685e-06, "loss": 1.0961, "step": 4616 }, { "epoch": 0.14, "learning_rate": 4.845595457847435e-06, "loss": 1.2049, "step": 4617 }, { "epoch": 0.14, "learning_rate": 4.845511052774463e-06, "loss": 1.131, "step": 4618 }, { "epoch": 0.14, "learning_rate": 4.845426625373355e-06, "loss": 1.2173, "step": 4619 }, { "epoch": 0.14, "learning_rate": 4.845342175644914e-06, "loss": 1.1292, "step": 4620 }, { "epoch": 0.14, "learning_rate": 4.845257703589946e-06, "loss": 1.1774, "step": 4621 }, { "epoch": 0.14, "learning_rate": 4.845173209209255e-06, "loss": 1.1329, "step": 4622 }, { "epoch": 0.14, "learning_rate": 4.845088692503644e-06, "loss": 1.2029, "step": 4623 }, { "epoch": 0.14, "learning_rate": 4.845004153473917e-06, "loss": 1.0533, "step": 4624 }, { "epoch": 0.14, "learning_rate": 4.844919592120881e-06, "loss": 1.2843, "step": 4625 }, { "epoch": 0.14, "learning_rate": 4.844835008445339e-06, "loss": 1.1209, "step": 4626 }, { "epoch": 0.14, "learning_rate": 4.844750402448098e-06, "loss": 1.0912, "step": 4627 }, { "epoch": 0.14, "learning_rate": 4.844665774129962e-06, "loss": 1.1429, "step": 4628 }, { "epoch": 0.14, "learning_rate": 4.844581123491737e-06, "loss": 1.1408, "step": 4629 }, { "epoch": 0.14, "learning_rate": 4.844496450534228e-06, "loss": 1.1573, "step": 4630 }, { "epoch": 0.14, "learning_rate": 4.8444117552582435e-06, "loss": 1.3149, "step": 4631 }, { "epoch": 0.14, "learning_rate": 4.844327037664588e-06, "loss": 1.1528, "step": 4632 }, { "epoch": 0.14, "learning_rate": 4.844242297754067e-06, "loss": 1.2094, "step": 4633 }, { "epoch": 0.14, "learning_rate": 4.84415753552749e-06, "loss": 1.0944, "step": 4634 }, { "epoch": 0.14, "learning_rate": 4.8440727509856604e-06, "loss": 1.1196, "step": 4635 }, { "epoch": 0.14, "learning_rate": 4.843987944129388e-06, "loss": 1.1331, "step": 4636 }, { "epoch": 0.14, "learning_rate": 4.8439031149594795e-06, "loss": 1.2115, "step": 4637 }, { "epoch": 0.14, "learning_rate": 4.843818263476742e-06, "loss": 1.2214, "step": 4638 }, { "epoch": 0.14, "learning_rate": 4.843733389681984e-06, "loss": 1.2211, "step": 4639 }, { "epoch": 0.14, "learning_rate": 4.843648493576012e-06, "loss": 1.174, "step": 4640 }, { "epoch": 0.14, "learning_rate": 4.843563575159635e-06, "loss": 1.1158, "step": 4641 }, { "epoch": 0.14, "learning_rate": 4.843478634433663e-06, "loss": 1.1755, "step": 4642 }, { "epoch": 0.14, "learning_rate": 4.843393671398901e-06, "loss": 1.2777, "step": 4643 }, { "epoch": 0.14, "learning_rate": 4.843308686056162e-06, "loss": 1.0038, "step": 4644 }, { "epoch": 0.14, "learning_rate": 4.843223678406252e-06, "loss": 1.1486, "step": 4645 }, { "epoch": 0.14, "learning_rate": 4.84313864844998e-06, "loss": 1.0833, "step": 4646 }, { "epoch": 0.14, "learning_rate": 4.8430535961881574e-06, "loss": 1.1624, "step": 4647 }, { "epoch": 0.14, "learning_rate": 4.842968521621593e-06, "loss": 1.1196, "step": 4648 }, { "epoch": 0.14, "learning_rate": 4.842883424751097e-06, "loss": 1.194, "step": 4649 }, { "epoch": 0.14, "learning_rate": 4.842798305577479e-06, "loss": 1.2164, "step": 4650 }, { "epoch": 0.14, "learning_rate": 4.842713164101549e-06, "loss": 1.1694, "step": 4651 }, { "epoch": 0.14, "learning_rate": 4.842628000324119e-06, "loss": 1.1804, "step": 4652 }, { "epoch": 0.14, "learning_rate": 4.842542814245997e-06, "loss": 1.229, "step": 4653 }, { "epoch": 0.14, "learning_rate": 4.842457605867997e-06, "loss": 1.0774, "step": 4654 }, { "epoch": 0.14, "learning_rate": 4.842372375190929e-06, "loss": 1.2008, "step": 4655 }, { "epoch": 0.14, "learning_rate": 4.842287122215603e-06, "loss": 1.2784, "step": 4656 }, { "epoch": 0.14, "learning_rate": 4.8422018469428325e-06, "loss": 1.2966, "step": 4657 }, { "epoch": 0.14, "learning_rate": 4.842116549373428e-06, "loss": 1.1238, "step": 4658 }, { "epoch": 0.14, "learning_rate": 4.842031229508202e-06, "loss": 1.1004, "step": 4659 }, { "epoch": 0.14, "learning_rate": 4.841945887347967e-06, "loss": 1.0731, "step": 4660 }, { "epoch": 0.14, "learning_rate": 4.841860522893534e-06, "loss": 1.198, "step": 4661 }, { "epoch": 0.14, "learning_rate": 4.841775136145719e-06, "loss": 1.0816, "step": 4662 }, { "epoch": 0.14, "learning_rate": 4.8416897271053305e-06, "loss": 1.1332, "step": 4663 }, { "epoch": 0.14, "learning_rate": 4.841604295773185e-06, "loss": 1.1703, "step": 4664 }, { "epoch": 0.14, "learning_rate": 4.841518842150092e-06, "loss": 1.1851, "step": 4665 }, { "epoch": 0.14, "learning_rate": 4.8414333662368694e-06, "loss": 1.1062, "step": 4666 }, { "epoch": 0.14, "learning_rate": 4.841347868034329e-06, "loss": 1.2375, "step": 4667 }, { "epoch": 0.14, "learning_rate": 4.841262347543283e-06, "loss": 1.2281, "step": 4668 }, { "epoch": 0.14, "learning_rate": 4.841176804764548e-06, "loss": 1.03, "step": 4669 }, { "epoch": 0.14, "learning_rate": 4.841091239698937e-06, "loss": 1.1829, "step": 4670 }, { "epoch": 0.14, "learning_rate": 4.841005652347266e-06, "loss": 1.2353, "step": 4671 }, { "epoch": 0.14, "learning_rate": 4.840920042710347e-06, "loss": 1.2153, "step": 4672 }, { "epoch": 0.14, "learning_rate": 4.840834410788998e-06, "loss": 1.2988, "step": 4673 }, { "epoch": 0.14, "learning_rate": 4.840748756584031e-06, "loss": 1.309, "step": 4674 }, { "epoch": 0.14, "learning_rate": 4.840663080096265e-06, "loss": 1.2615, "step": 4675 }, { "epoch": 0.14, "learning_rate": 4.840577381326513e-06, "loss": 1.1895, "step": 4676 }, { "epoch": 0.14, "learning_rate": 4.840491660275593e-06, "loss": 1.1465, "step": 4677 }, { "epoch": 0.14, "learning_rate": 4.840405916944317e-06, "loss": 1.1753, "step": 4678 }, { "epoch": 0.14, "learning_rate": 4.8403201513335065e-06, "loss": 1.1925, "step": 4679 }, { "epoch": 0.14, "learning_rate": 4.840234363443973e-06, "loss": 1.2009, "step": 4680 }, { "epoch": 0.14, "learning_rate": 4.840148553276537e-06, "loss": 1.0724, "step": 4681 }, { "epoch": 0.14, "learning_rate": 4.840062720832013e-06, "loss": 1.1461, "step": 4682 }, { "epoch": 0.14, "learning_rate": 4.83997686611122e-06, "loss": 1.0833, "step": 4683 }, { "epoch": 0.14, "learning_rate": 4.839890989114972e-06, "loss": 1.1687, "step": 4684 }, { "epoch": 0.14, "learning_rate": 4.83980508984409e-06, "loss": 1.199, "step": 4685 }, { "epoch": 0.14, "learning_rate": 4.839719168299392e-06, "loss": 1.1369, "step": 4686 }, { "epoch": 0.14, "learning_rate": 4.839633224481692e-06, "loss": 1.1998, "step": 4687 }, { "epoch": 0.14, "learning_rate": 4.839547258391812e-06, "loss": 1.3625, "step": 4688 }, { "epoch": 0.14, "learning_rate": 4.839461270030568e-06, "loss": 1.1862, "step": 4689 }, { "epoch": 0.14, "learning_rate": 4.83937525939878e-06, "loss": 1.1451, "step": 4690 }, { "epoch": 0.14, "learning_rate": 4.839289226497266e-06, "loss": 1.0756, "step": 4691 }, { "epoch": 0.14, "learning_rate": 4.839203171326845e-06, "loss": 1.2166, "step": 4692 }, { "epoch": 0.14, "learning_rate": 4.839117093888337e-06, "loss": 1.1453, "step": 4693 }, { "epoch": 0.14, "learning_rate": 4.8390309941825595e-06, "loss": 1.1298, "step": 4694 }, { "epoch": 0.14, "learning_rate": 4.838944872210335e-06, "loss": 1.2223, "step": 4695 }, { "epoch": 0.14, "learning_rate": 4.8388587279724805e-06, "loss": 1.1928, "step": 4696 }, { "epoch": 0.14, "learning_rate": 4.838772561469819e-06, "loss": 1.1726, "step": 4697 }, { "epoch": 0.14, "learning_rate": 4.838686372703168e-06, "loss": 1.0573, "step": 4698 }, { "epoch": 0.14, "learning_rate": 4.8386001616733495e-06, "loss": 1.2316, "step": 4699 }, { "epoch": 0.14, "learning_rate": 4.838513928381183e-06, "loss": 1.0742, "step": 4700 }, { "epoch": 0.14, "learning_rate": 4.838427672827491e-06, "loss": 1.2354, "step": 4701 }, { "epoch": 0.14, "learning_rate": 4.838341395013093e-06, "loss": 1.2188, "step": 4702 }, { "epoch": 0.14, "learning_rate": 4.838255094938811e-06, "loss": 1.1667, "step": 4703 }, { "epoch": 0.14, "learning_rate": 4.838168772605467e-06, "loss": 1.0923, "step": 4704 }, { "epoch": 0.14, "learning_rate": 4.8380824280138825e-06, "loss": 1.1849, "step": 4705 }, { "epoch": 0.14, "learning_rate": 4.837996061164879e-06, "loss": 1.2236, "step": 4706 }, { "epoch": 0.14, "learning_rate": 4.83790967205928e-06, "loss": 1.1918, "step": 4707 }, { "epoch": 0.14, "learning_rate": 4.837823260697907e-06, "loss": 1.0723, "step": 4708 }, { "epoch": 0.14, "learning_rate": 4.837736827081581e-06, "loss": 1.173, "step": 4709 }, { "epoch": 0.14, "learning_rate": 4.837650371211127e-06, "loss": 1.2003, "step": 4710 }, { "epoch": 0.14, "learning_rate": 4.8375638930873675e-06, "loss": 1.1868, "step": 4711 }, { "epoch": 0.14, "learning_rate": 4.837477392711125e-06, "loss": 1.2026, "step": 4712 }, { "epoch": 0.14, "learning_rate": 4.837390870083224e-06, "loss": 1.0708, "step": 4713 }, { "epoch": 0.14, "learning_rate": 4.837304325204488e-06, "loss": 1.1433, "step": 4714 }, { "epoch": 0.14, "learning_rate": 4.8372177580757394e-06, "loss": 1.0849, "step": 4715 }, { "epoch": 0.14, "learning_rate": 4.837131168697805e-06, "loss": 1.085, "step": 4716 }, { "epoch": 0.14, "learning_rate": 4.837044557071507e-06, "loss": 1.187, "step": 4717 }, { "epoch": 0.14, "learning_rate": 4.836957923197669e-06, "loss": 1.2571, "step": 4718 }, { "epoch": 0.14, "learning_rate": 4.8368712670771176e-06, "loss": 1.2086, "step": 4719 }, { "epoch": 0.14, "learning_rate": 4.836784588710678e-06, "loss": 1.1207, "step": 4720 }, { "epoch": 0.14, "learning_rate": 4.836697888099175e-06, "loss": 1.1705, "step": 4721 }, { "epoch": 0.14, "learning_rate": 4.836611165243432e-06, "loss": 1.1424, "step": 4722 }, { "epoch": 0.14, "learning_rate": 4.836524420144276e-06, "loss": 1.1302, "step": 4723 }, { "epoch": 0.14, "learning_rate": 4.836437652802534e-06, "loss": 1.1801, "step": 4724 }, { "epoch": 0.14, "learning_rate": 4.83635086321903e-06, "loss": 1.1849, "step": 4725 }, { "epoch": 0.14, "learning_rate": 4.836264051394592e-06, "loss": 1.1172, "step": 4726 }, { "epoch": 0.14, "learning_rate": 4.836177217330045e-06, "loss": 1.1988, "step": 4727 }, { "epoch": 0.14, "learning_rate": 4.836090361026216e-06, "loss": 1.1881, "step": 4728 }, { "epoch": 0.14, "learning_rate": 4.836003482483931e-06, "loss": 1.1401, "step": 4729 }, { "epoch": 0.14, "learning_rate": 4.835916581704019e-06, "loss": 1.1794, "step": 4730 }, { "epoch": 0.14, "learning_rate": 4.8358296586873056e-06, "loss": 1.136, "step": 4731 }, { "epoch": 0.14, "learning_rate": 4.835742713434619e-06, "loss": 1.1617, "step": 4732 }, { "epoch": 0.14, "learning_rate": 4.835655745946787e-06, "loss": 1.0214, "step": 4733 }, { "epoch": 0.14, "learning_rate": 4.835568756224636e-06, "loss": 1.2534, "step": 4734 }, { "epoch": 0.14, "learning_rate": 4.835481744268996e-06, "loss": 1.2228, "step": 4735 }, { "epoch": 0.14, "learning_rate": 4.835394710080695e-06, "loss": 1.1185, "step": 4736 }, { "epoch": 0.14, "learning_rate": 4.835307653660561e-06, "loss": 1.0853, "step": 4737 }, { "epoch": 0.14, "learning_rate": 4.835220575009423e-06, "loss": 1.1703, "step": 4738 }, { "epoch": 0.14, "learning_rate": 4.835133474128109e-06, "loss": 1.1093, "step": 4739 }, { "epoch": 0.14, "learning_rate": 4.835046351017449e-06, "loss": 1.1158, "step": 4740 }, { "epoch": 0.14, "learning_rate": 4.834959205678273e-06, "loss": 1.0523, "step": 4741 }, { "epoch": 0.14, "learning_rate": 4.83487203811141e-06, "loss": 1.2347, "step": 4742 }, { "epoch": 0.14, "learning_rate": 4.83478484831769e-06, "loss": 1.2378, "step": 4743 }, { "epoch": 0.14, "learning_rate": 4.834697636297941e-06, "loss": 1.1355, "step": 4744 }, { "epoch": 0.14, "learning_rate": 4.834610402052997e-06, "loss": 1.2009, "step": 4745 }, { "epoch": 0.14, "learning_rate": 4.834523145583685e-06, "loss": 1.1351, "step": 4746 }, { "epoch": 0.14, "learning_rate": 4.834435866890837e-06, "loss": 1.0809, "step": 4747 }, { "epoch": 0.14, "learning_rate": 4.834348565975285e-06, "loss": 1.2297, "step": 4748 }, { "epoch": 0.14, "learning_rate": 4.834261242837858e-06, "loss": 1.28, "step": 4749 }, { "epoch": 0.14, "learning_rate": 4.834173897479388e-06, "loss": 1.2218, "step": 4750 }, { "epoch": 0.14, "learning_rate": 4.8340865299007075e-06, "loss": 1.1367, "step": 4751 }, { "epoch": 0.14, "learning_rate": 4.833999140102647e-06, "loss": 1.1096, "step": 4752 }, { "epoch": 0.14, "learning_rate": 4.833911728086039e-06, "loss": 1.074, "step": 4753 }, { "epoch": 0.14, "learning_rate": 4.8338242938517155e-06, "loss": 1.2277, "step": 4754 }, { "epoch": 0.14, "learning_rate": 4.833736837400508e-06, "loss": 1.1371, "step": 4755 }, { "epoch": 0.14, "learning_rate": 4.83364935873325e-06, "loss": 1.2201, "step": 4756 }, { "epoch": 0.14, "learning_rate": 4.833561857850774e-06, "loss": 1.223, "step": 4757 }, { "epoch": 0.14, "learning_rate": 4.833474334753913e-06, "loss": 1.2225, "step": 4758 }, { "epoch": 0.14, "learning_rate": 4.8333867894435e-06, "loss": 1.064, "step": 4759 }, { "epoch": 0.14, "learning_rate": 4.8332992219203695e-06, "loss": 1.1245, "step": 4760 }, { "epoch": 0.14, "learning_rate": 4.833211632185354e-06, "loss": 1.1398, "step": 4761 }, { "epoch": 0.14, "learning_rate": 4.8331240202392875e-06, "loss": 1.1443, "step": 4762 }, { "epoch": 0.14, "learning_rate": 4.833036386083002e-06, "loss": 1.0903, "step": 4763 }, { "epoch": 0.14, "learning_rate": 4.832948729717336e-06, "loss": 1.2303, "step": 4764 }, { "epoch": 0.14, "learning_rate": 4.832861051143121e-06, "loss": 1.0753, "step": 4765 }, { "epoch": 0.14, "learning_rate": 4.832773350361192e-06, "loss": 1.0717, "step": 4766 }, { "epoch": 0.14, "learning_rate": 4.8326856273723845e-06, "loss": 1.1832, "step": 4767 }, { "epoch": 0.14, "learning_rate": 4.832597882177533e-06, "loss": 1.2881, "step": 4768 }, { "epoch": 0.14, "learning_rate": 4.832510114777474e-06, "loss": 1.2025, "step": 4769 }, { "epoch": 0.14, "learning_rate": 4.832422325173041e-06, "loss": 1.1981, "step": 4770 }, { "epoch": 0.14, "learning_rate": 4.832334513365071e-06, "loss": 1.1319, "step": 4771 }, { "epoch": 0.14, "learning_rate": 4.832246679354401e-06, "loss": 1.1275, "step": 4772 }, { "epoch": 0.14, "learning_rate": 4.832158823141864e-06, "loss": 1.1152, "step": 4773 }, { "epoch": 0.14, "learning_rate": 4.8320709447283e-06, "loss": 1.1805, "step": 4774 }, { "epoch": 0.14, "learning_rate": 4.831983044114542e-06, "loss": 1.0646, "step": 4775 }, { "epoch": 0.14, "learning_rate": 4.83189512130143e-06, "loss": 1.155, "step": 4776 }, { "epoch": 0.14, "learning_rate": 4.831807176289799e-06, "loss": 1.0905, "step": 4777 }, { "epoch": 0.14, "learning_rate": 4.8317192090804854e-06, "loss": 1.0764, "step": 4778 }, { "epoch": 0.14, "learning_rate": 4.83163121967433e-06, "loss": 1.1705, "step": 4779 }, { "epoch": 0.14, "learning_rate": 4.831543208072167e-06, "loss": 1.2847, "step": 4780 }, { "epoch": 0.14, "learning_rate": 4.831455174274836e-06, "loss": 1.2447, "step": 4781 }, { "epoch": 0.14, "learning_rate": 4.8313671182831745e-06, "loss": 1.0786, "step": 4782 }, { "epoch": 0.14, "learning_rate": 4.831279040098021e-06, "loss": 1.1259, "step": 4783 }, { "epoch": 0.14, "learning_rate": 4.831190939720214e-06, "loss": 1.1417, "step": 4784 }, { "epoch": 0.14, "learning_rate": 4.831102817150591e-06, "loss": 1.1601, "step": 4785 }, { "epoch": 0.14, "learning_rate": 4.831014672389993e-06, "loss": 1.2255, "step": 4786 }, { "epoch": 0.14, "learning_rate": 4.830926505439258e-06, "loss": 1.2244, "step": 4787 }, { "epoch": 0.14, "learning_rate": 4.830838316299225e-06, "loss": 1.1673, "step": 4788 }, { "epoch": 0.14, "learning_rate": 4.830750104970734e-06, "loss": 1.2245, "step": 4789 }, { "epoch": 0.14, "learning_rate": 4.830661871454624e-06, "loss": 1.1392, "step": 4790 }, { "epoch": 0.14, "learning_rate": 4.8305736157517355e-06, "loss": 1.1854, "step": 4791 }, { "epoch": 0.14, "learning_rate": 4.830485337862909e-06, "loss": 1.1916, "step": 4792 }, { "epoch": 0.14, "learning_rate": 4.830397037788984e-06, "loss": 1.2249, "step": 4793 }, { "epoch": 0.14, "learning_rate": 4.830308715530802e-06, "loss": 1.184, "step": 4794 }, { "epoch": 0.14, "learning_rate": 4.830220371089204e-06, "loss": 1.0767, "step": 4795 }, { "epoch": 0.14, "learning_rate": 4.830132004465029e-06, "loss": 1.1578, "step": 4796 }, { "epoch": 0.14, "learning_rate": 4.83004361565912e-06, "loss": 1.0778, "step": 4797 }, { "epoch": 0.14, "learning_rate": 4.829955204672318e-06, "loss": 1.235, "step": 4798 }, { "epoch": 0.14, "learning_rate": 4.829866771505465e-06, "loss": 1.2532, "step": 4799 }, { "epoch": 0.14, "learning_rate": 4.829778316159402e-06, "loss": 1.0303, "step": 4800 }, { "epoch": 0.14, "learning_rate": 4.829689838634972e-06, "loss": 1.1094, "step": 4801 }, { "epoch": 0.14, "learning_rate": 4.829601338933016e-06, "loss": 1.106, "step": 4802 }, { "epoch": 0.14, "learning_rate": 4.829512817054377e-06, "loss": 1.0918, "step": 4803 }, { "epoch": 0.14, "learning_rate": 4.829424272999899e-06, "loss": 1.1361, "step": 4804 }, { "epoch": 0.14, "learning_rate": 4.829335706770423e-06, "loss": 1.1678, "step": 4805 }, { "epoch": 0.14, "learning_rate": 4.8292471183667935e-06, "loss": 1.2606, "step": 4806 }, { "epoch": 0.14, "learning_rate": 4.829158507789853e-06, "loss": 1.1961, "step": 4807 }, { "epoch": 0.14, "learning_rate": 4.829069875040445e-06, "loss": 1.111, "step": 4808 }, { "epoch": 0.14, "learning_rate": 4.828981220119414e-06, "loss": 1.1446, "step": 4809 }, { "epoch": 0.14, "learning_rate": 4.828892543027603e-06, "loss": 1.1014, "step": 4810 }, { "epoch": 0.14, "learning_rate": 4.828803843765857e-06, "loss": 1.1323, "step": 4811 }, { "epoch": 0.14, "learning_rate": 4.82871512233502e-06, "loss": 1.1598, "step": 4812 }, { "epoch": 0.14, "learning_rate": 4.8286263787359365e-06, "loss": 0.9788, "step": 4813 }, { "epoch": 0.15, "learning_rate": 4.828537612969451e-06, "loss": 1.2153, "step": 4814 }, { "epoch": 0.15, "learning_rate": 4.8284488250364095e-06, "loss": 1.1257, "step": 4815 }, { "epoch": 0.15, "learning_rate": 4.828360014937656e-06, "loss": 1.1124, "step": 4816 }, { "epoch": 0.15, "learning_rate": 4.828271182674037e-06, "loss": 1.2319, "step": 4817 }, { "epoch": 0.15, "learning_rate": 4.828182328246398e-06, "loss": 1.1606, "step": 4818 }, { "epoch": 0.15, "learning_rate": 4.828093451655584e-06, "loss": 1.0231, "step": 4819 }, { "epoch": 0.15, "learning_rate": 4.828004552902441e-06, "loss": 1.1147, "step": 4820 }, { "epoch": 0.15, "learning_rate": 4.827915631987816e-06, "loss": 1.0895, "step": 4821 }, { "epoch": 0.15, "learning_rate": 4.827826688912556e-06, "loss": 1.1294, "step": 4822 }, { "epoch": 0.15, "learning_rate": 4.827737723677507e-06, "loss": 1.178, "step": 4823 }, { "epoch": 0.15, "learning_rate": 4.827648736283515e-06, "loss": 1.1162, "step": 4824 }, { "epoch": 0.15, "learning_rate": 4.82755972673143e-06, "loss": 1.1953, "step": 4825 }, { "epoch": 0.15, "learning_rate": 4.827470695022097e-06, "loss": 1.1404, "step": 4826 }, { "epoch": 0.15, "learning_rate": 4.827381641156363e-06, "loss": 1.0623, "step": 4827 }, { "epoch": 0.15, "learning_rate": 4.827292565135076e-06, "loss": 1.2498, "step": 4828 }, { "epoch": 0.15, "learning_rate": 4.827203466959086e-06, "loss": 1.2373, "step": 4829 }, { "epoch": 0.15, "learning_rate": 4.827114346629239e-06, "loss": 1.1569, "step": 4830 }, { "epoch": 0.15, "learning_rate": 4.827025204146384e-06, "loss": 1.144, "step": 4831 }, { "epoch": 0.15, "learning_rate": 4.826936039511371e-06, "loss": 1.1399, "step": 4832 }, { "epoch": 0.15, "learning_rate": 4.826846852725047e-06, "loss": 1.1353, "step": 4833 }, { "epoch": 0.15, "learning_rate": 4.8267576437882614e-06, "loss": 1.0605, "step": 4834 }, { "epoch": 0.15, "learning_rate": 4.8266684127018634e-06, "loss": 1.1865, "step": 4835 }, { "epoch": 0.15, "learning_rate": 4.826579159466703e-06, "loss": 1.1809, "step": 4836 }, { "epoch": 0.15, "learning_rate": 4.82648988408363e-06, "loss": 1.2192, "step": 4837 }, { "epoch": 0.15, "learning_rate": 4.826400586553493e-06, "loss": 1.2599, "step": 4838 }, { "epoch": 0.15, "learning_rate": 4.826311266877143e-06, "loss": 1.2128, "step": 4839 }, { "epoch": 0.15, "learning_rate": 4.82622192505543e-06, "loss": 1.0716, "step": 4840 }, { "epoch": 0.15, "learning_rate": 4.826132561089205e-06, "loss": 1.183, "step": 4841 }, { "epoch": 0.15, "learning_rate": 4.8260431749793185e-06, "loss": 1.1667, "step": 4842 }, { "epoch": 0.15, "learning_rate": 4.825953766726621e-06, "loss": 1.3334, "step": 4843 }, { "epoch": 0.15, "learning_rate": 4.825864336331964e-06, "loss": 1.2532, "step": 4844 }, { "epoch": 0.15, "learning_rate": 4.825774883796198e-06, "loss": 1.1827, "step": 4845 }, { "epoch": 0.15, "learning_rate": 4.825685409120176e-06, "loss": 1.1385, "step": 4846 }, { "epoch": 0.15, "learning_rate": 4.825595912304749e-06, "loss": 1.1396, "step": 4847 }, { "epoch": 0.15, "learning_rate": 4.825506393350769e-06, "loss": 1.1131, "step": 4848 }, { "epoch": 0.15, "learning_rate": 4.825416852259088e-06, "loss": 1.1941, "step": 4849 }, { "epoch": 0.15, "learning_rate": 4.825327289030558e-06, "loss": 1.1577, "step": 4850 }, { "epoch": 0.15, "learning_rate": 4.825237703666032e-06, "loss": 1.0801, "step": 4851 }, { "epoch": 0.15, "learning_rate": 4.825148096166365e-06, "loss": 1.1577, "step": 4852 }, { "epoch": 0.15, "learning_rate": 4.825058466532405e-06, "loss": 1.0214, "step": 4853 }, { "epoch": 0.15, "learning_rate": 4.82496881476501e-06, "loss": 1.1328, "step": 4854 }, { "epoch": 0.15, "learning_rate": 4.824879140865031e-06, "loss": 1.2075, "step": 4855 }, { "epoch": 0.15, "learning_rate": 4.824789444833323e-06, "loss": 1.1596, "step": 4856 }, { "epoch": 0.15, "learning_rate": 4.824699726670738e-06, "loss": 1.214, "step": 4857 }, { "epoch": 0.15, "learning_rate": 4.824609986378132e-06, "loss": 1.145, "step": 4858 }, { "epoch": 0.15, "learning_rate": 4.824520223956358e-06, "loss": 1.1349, "step": 4859 }, { "epoch": 0.15, "learning_rate": 4.824430439406272e-06, "loss": 1.1147, "step": 4860 }, { "epoch": 0.15, "learning_rate": 4.824340632728727e-06, "loss": 1.208, "step": 4861 }, { "epoch": 0.15, "learning_rate": 4.824250803924578e-06, "loss": 1.2114, "step": 4862 }, { "epoch": 0.15, "learning_rate": 4.824160952994682e-06, "loss": 1.2214, "step": 4863 }, { "epoch": 0.15, "learning_rate": 4.824071079939892e-06, "loss": 1.2181, "step": 4864 }, { "epoch": 0.15, "learning_rate": 4.823981184761065e-06, "loss": 1.0046, "step": 4865 }, { "epoch": 0.15, "learning_rate": 4.823891267459057e-06, "loss": 1.1766, "step": 4866 }, { "epoch": 0.15, "learning_rate": 4.823801328034723e-06, "loss": 1.1367, "step": 4867 }, { "epoch": 0.15, "learning_rate": 4.823711366488919e-06, "loss": 1.1235, "step": 4868 }, { "epoch": 0.15, "learning_rate": 4.823621382822503e-06, "loss": 1.1583, "step": 4869 }, { "epoch": 0.15, "learning_rate": 4.8235313770363295e-06, "loss": 1.1982, "step": 4870 }, { "epoch": 0.15, "learning_rate": 4.823441349131257e-06, "loss": 1.076, "step": 4871 }, { "epoch": 0.15, "learning_rate": 4.8233512991081414e-06, "loss": 1.1746, "step": 4872 }, { "epoch": 0.15, "learning_rate": 4.82326122696784e-06, "loss": 1.1082, "step": 4873 }, { "epoch": 0.15, "learning_rate": 4.823171132711212e-06, "loss": 1.2612, "step": 4874 }, { "epoch": 0.15, "learning_rate": 4.823081016339113e-06, "loss": 1.2511, "step": 4875 }, { "epoch": 0.15, "learning_rate": 4.8229908778524015e-06, "loss": 1.2034, "step": 4876 }, { "epoch": 0.15, "learning_rate": 4.822900717251935e-06, "loss": 1.1731, "step": 4877 }, { "epoch": 0.15, "learning_rate": 4.822810534538573e-06, "loss": 1.1119, "step": 4878 }, { "epoch": 0.15, "learning_rate": 4.822720329713174e-06, "loss": 1.1327, "step": 4879 }, { "epoch": 0.15, "learning_rate": 4.822630102776596e-06, "loss": 1.2001, "step": 4880 }, { "epoch": 0.15, "learning_rate": 4.822539853729697e-06, "loss": 1.1786, "step": 4881 }, { "epoch": 0.15, "learning_rate": 4.822449582573337e-06, "loss": 1.0527, "step": 4882 }, { "epoch": 0.15, "learning_rate": 4.822359289308377e-06, "loss": 1.0919, "step": 4883 }, { "epoch": 0.15, "learning_rate": 4.8222689739356745e-06, "loss": 1.2002, "step": 4884 }, { "epoch": 0.15, "learning_rate": 4.822178636456089e-06, "loss": 1.1569, "step": 4885 }, { "epoch": 0.15, "learning_rate": 4.822088276870482e-06, "loss": 1.2329, "step": 4886 }, { "epoch": 0.15, "learning_rate": 4.821997895179713e-06, "loss": 1.1447, "step": 4887 }, { "epoch": 0.15, "learning_rate": 4.821907491384642e-06, "loss": 1.1481, "step": 4888 }, { "epoch": 0.15, "learning_rate": 4.8218170654861305e-06, "loss": 1.1714, "step": 4889 }, { "epoch": 0.15, "learning_rate": 4.821726617485038e-06, "loss": 1.1259, "step": 4890 }, { "epoch": 0.15, "learning_rate": 4.821636147382227e-06, "loss": 1.0792, "step": 4891 }, { "epoch": 0.15, "learning_rate": 4.8215456551785575e-06, "loss": 1.1902, "step": 4892 }, { "epoch": 0.15, "learning_rate": 4.8214551408748925e-06, "loss": 1.2142, "step": 4893 }, { "epoch": 0.15, "learning_rate": 4.821364604472091e-06, "loss": 1.1619, "step": 4894 }, { "epoch": 0.15, "learning_rate": 4.821274045971017e-06, "loss": 1.1453, "step": 4895 }, { "epoch": 0.15, "learning_rate": 4.821183465372533e-06, "loss": 1.182, "step": 4896 }, { "epoch": 0.15, "learning_rate": 4.821092862677499e-06, "loss": 1.09, "step": 4897 }, { "epoch": 0.15, "learning_rate": 4.82100223788678e-06, "loss": 1.1368, "step": 4898 }, { "epoch": 0.15, "learning_rate": 4.820911591001237e-06, "loss": 1.2705, "step": 4899 }, { "epoch": 0.15, "learning_rate": 4.820820922021733e-06, "loss": 1.1595, "step": 4900 }, { "epoch": 0.15, "learning_rate": 4.820730230949132e-06, "loss": 1.1378, "step": 4901 }, { "epoch": 0.15, "learning_rate": 4.820639517784298e-06, "loss": 1.1949, "step": 4902 }, { "epoch": 0.15, "learning_rate": 4.820548782528092e-06, "loss": 1.0546, "step": 4903 }, { "epoch": 0.15, "learning_rate": 4.820458025181379e-06, "loss": 1.1942, "step": 4904 }, { "epoch": 0.15, "learning_rate": 4.820367245745024e-06, "loss": 1.291, "step": 4905 }, { "epoch": 0.15, "learning_rate": 4.8202764442198905e-06, "loss": 1.2822, "step": 4906 }, { "epoch": 0.15, "learning_rate": 4.820185620606842e-06, "loss": 1.1308, "step": 4907 }, { "epoch": 0.15, "learning_rate": 4.820094774906744e-06, "loss": 1.1511, "step": 4908 }, { "epoch": 0.15, "learning_rate": 4.820003907120461e-06, "loss": 1.0804, "step": 4909 }, { "epoch": 0.15, "learning_rate": 4.819913017248859e-06, "loss": 1.2262, "step": 4910 }, { "epoch": 0.15, "learning_rate": 4.8198221052928015e-06, "loss": 1.1371, "step": 4911 }, { "epoch": 0.15, "learning_rate": 4.819731171253156e-06, "loss": 1.1498, "step": 4912 }, { "epoch": 0.15, "learning_rate": 4.8196402151307856e-06, "loss": 1.0912, "step": 4913 }, { "epoch": 0.15, "learning_rate": 4.819549236926558e-06, "loss": 1.153, "step": 4914 }, { "epoch": 0.15, "learning_rate": 4.819458236641339e-06, "loss": 1.0759, "step": 4915 }, { "epoch": 0.15, "learning_rate": 4.819367214275994e-06, "loss": 1.1168, "step": 4916 }, { "epoch": 0.15, "learning_rate": 4.819276169831391e-06, "loss": 1.063, "step": 4917 }, { "epoch": 0.15, "learning_rate": 4.819185103308396e-06, "loss": 1.3358, "step": 4918 }, { "epoch": 0.15, "learning_rate": 4.819094014707875e-06, "loss": 1.2311, "step": 4919 }, { "epoch": 0.15, "learning_rate": 4.819002904030696e-06, "loss": 1.2134, "step": 4920 }, { "epoch": 0.15, "learning_rate": 4.818911771277727e-06, "loss": 1.1468, "step": 4921 }, { "epoch": 0.15, "learning_rate": 4.8188206164498335e-06, "loss": 1.1392, "step": 4922 }, { "epoch": 0.15, "learning_rate": 4.818729439547885e-06, "loss": 1.1586, "step": 4923 }, { "epoch": 0.15, "learning_rate": 4.81863824057275e-06, "loss": 1.2313, "step": 4924 }, { "epoch": 0.15, "learning_rate": 4.818547019525295e-06, "loss": 1.1879, "step": 4925 }, { "epoch": 0.15, "learning_rate": 4.818455776406388e-06, "loss": 1.2172, "step": 4926 }, { "epoch": 0.15, "learning_rate": 4.8183645112169e-06, "loss": 1.2459, "step": 4927 }, { "epoch": 0.15, "learning_rate": 4.818273223957698e-06, "loss": 1.043, "step": 4928 }, { "epoch": 0.15, "learning_rate": 4.818181914629651e-06, "loss": 1.1876, "step": 4929 }, { "epoch": 0.15, "learning_rate": 4.8180905832336285e-06, "loss": 1.0429, "step": 4930 }, { "epoch": 0.15, "learning_rate": 4.817999229770502e-06, "loss": 1.2488, "step": 4931 }, { "epoch": 0.15, "learning_rate": 4.817907854241137e-06, "loss": 1.0491, "step": 4932 }, { "epoch": 0.15, "learning_rate": 4.817816456646406e-06, "loss": 1.0366, "step": 4933 }, { "epoch": 0.15, "learning_rate": 4.817725036987179e-06, "loss": 1.171, "step": 4934 }, { "epoch": 0.15, "learning_rate": 4.817633595264326e-06, "loss": 1.2132, "step": 4935 }, { "epoch": 0.15, "learning_rate": 4.817542131478717e-06, "loss": 1.1609, "step": 4936 }, { "epoch": 0.15, "learning_rate": 4.817450645631223e-06, "loss": 1.2845, "step": 4937 }, { "epoch": 0.15, "learning_rate": 4.817359137722716e-06, "loss": 1.1595, "step": 4938 }, { "epoch": 0.15, "learning_rate": 4.8172676077540655e-06, "loss": 1.1937, "step": 4939 }, { "epoch": 0.15, "learning_rate": 4.817176055726143e-06, "loss": 1.2899, "step": 4940 }, { "epoch": 0.15, "learning_rate": 4.817084481639821e-06, "loss": 1.1319, "step": 4941 }, { "epoch": 0.15, "learning_rate": 4.81699288549597e-06, "loss": 1.2631, "step": 4942 }, { "epoch": 0.15, "learning_rate": 4.816901267295463e-06, "loss": 1.189, "step": 4943 }, { "epoch": 0.15, "learning_rate": 4.8168096270391715e-06, "loss": 1.2044, "step": 4944 }, { "epoch": 0.15, "learning_rate": 4.816717964727969e-06, "loss": 1.0645, "step": 4945 }, { "epoch": 0.15, "learning_rate": 4.816626280362728e-06, "loss": 1.2051, "step": 4946 }, { "epoch": 0.15, "learning_rate": 4.816534573944318e-06, "loss": 1.0785, "step": 4947 }, { "epoch": 0.15, "learning_rate": 4.8164428454736156e-06, "loss": 1.1326, "step": 4948 }, { "epoch": 0.15, "learning_rate": 4.816351094951493e-06, "loss": 1.173, "step": 4949 }, { "epoch": 0.15, "learning_rate": 4.816259322378825e-06, "loss": 1.1928, "step": 4950 }, { "epoch": 0.15, "learning_rate": 4.816167527756482e-06, "loss": 1.2097, "step": 4951 }, { "epoch": 0.15, "learning_rate": 4.81607571108534e-06, "loss": 1.0623, "step": 4952 }, { "epoch": 0.15, "learning_rate": 4.815983872366273e-06, "loss": 1.149, "step": 4953 }, { "epoch": 0.15, "learning_rate": 4.815892011600155e-06, "loss": 1.1465, "step": 4954 }, { "epoch": 0.15, "learning_rate": 4.815800128787859e-06, "loss": 1.1523, "step": 4955 }, { "epoch": 0.15, "learning_rate": 4.8157082239302634e-06, "loss": 1.1624, "step": 4956 }, { "epoch": 0.15, "learning_rate": 4.8156162970282395e-06, "loss": 1.1255, "step": 4957 }, { "epoch": 0.15, "learning_rate": 4.815524348082664e-06, "loss": 1.2352, "step": 4958 }, { "epoch": 0.15, "learning_rate": 4.8154323770944125e-06, "loss": 1.0963, "step": 4959 }, { "epoch": 0.15, "learning_rate": 4.815340384064359e-06, "loss": 1.1776, "step": 4960 }, { "epoch": 0.15, "learning_rate": 4.81524836899338e-06, "loss": 1.1203, "step": 4961 }, { "epoch": 0.15, "learning_rate": 4.815156331882353e-06, "loss": 1.2274, "step": 4962 }, { "epoch": 0.15, "learning_rate": 4.8150642727321506e-06, "loss": 1.09, "step": 4963 }, { "epoch": 0.15, "learning_rate": 4.814972191543653e-06, "loss": 1.1463, "step": 4964 }, { "epoch": 0.15, "learning_rate": 4.814880088317734e-06, "loss": 1.0845, "step": 4965 }, { "epoch": 0.15, "learning_rate": 4.814787963055273e-06, "loss": 1.2043, "step": 4966 }, { "epoch": 0.15, "learning_rate": 4.814695815757144e-06, "loss": 1.1557, "step": 4967 }, { "epoch": 0.15, "learning_rate": 4.814603646424226e-06, "loss": 1.1121, "step": 4968 }, { "epoch": 0.15, "learning_rate": 4.814511455057396e-06, "loss": 1.2373, "step": 4969 }, { "epoch": 0.15, "learning_rate": 4.814419241657531e-06, "loss": 1.123, "step": 4970 }, { "epoch": 0.15, "learning_rate": 4.814327006225511e-06, "loss": 1.1134, "step": 4971 }, { "epoch": 0.15, "learning_rate": 4.814234748762211e-06, "loss": 1.095, "step": 4972 }, { "epoch": 0.15, "learning_rate": 4.814142469268512e-06, "loss": 1.2777, "step": 4973 }, { "epoch": 0.15, "learning_rate": 4.81405016774529e-06, "loss": 1.0357, "step": 4974 }, { "epoch": 0.15, "learning_rate": 4.813957844193426e-06, "loss": 1.2346, "step": 4975 }, { "epoch": 0.15, "learning_rate": 4.813865498613797e-06, "loss": 1.1519, "step": 4976 }, { "epoch": 0.15, "learning_rate": 4.813773131007283e-06, "loss": 1.1615, "step": 4977 }, { "epoch": 0.15, "learning_rate": 4.8136807413747635e-06, "loss": 1.121, "step": 4978 }, { "epoch": 0.15, "learning_rate": 4.813588329717118e-06, "loss": 1.1741, "step": 4979 }, { "epoch": 0.15, "learning_rate": 4.813495896035225e-06, "loss": 1.3403, "step": 4980 }, { "epoch": 0.15, "learning_rate": 4.813403440329966e-06, "loss": 1.02, "step": 4981 }, { "epoch": 0.15, "learning_rate": 4.81331096260222e-06, "loss": 1.1896, "step": 4982 }, { "epoch": 0.15, "learning_rate": 4.8132184628528675e-06, "loss": 1.2369, "step": 4983 }, { "epoch": 0.15, "learning_rate": 4.81312594108279e-06, "loss": 1.1497, "step": 4984 }, { "epoch": 0.15, "learning_rate": 4.813033397292867e-06, "loss": 1.1135, "step": 4985 }, { "epoch": 0.15, "learning_rate": 4.812940831483981e-06, "loss": 1.214, "step": 4986 }, { "epoch": 0.15, "learning_rate": 4.812848243657011e-06, "loss": 1.3073, "step": 4987 }, { "epoch": 0.15, "learning_rate": 4.81275563381284e-06, "loss": 1.3121, "step": 4988 }, { "epoch": 0.15, "learning_rate": 4.812663001952349e-06, "loss": 1.0705, "step": 4989 }, { "epoch": 0.15, "learning_rate": 4.812570348076421e-06, "loss": 1.2297, "step": 4990 }, { "epoch": 0.15, "learning_rate": 4.812477672185936e-06, "loss": 1.0856, "step": 4991 }, { "epoch": 0.15, "learning_rate": 4.812384974281778e-06, "loss": 1.039, "step": 4992 }, { "epoch": 0.15, "learning_rate": 4.812292254364829e-06, "loss": 1.2058, "step": 4993 }, { "epoch": 0.15, "learning_rate": 4.81219951243597e-06, "loss": 1.1547, "step": 4994 }, { "epoch": 0.15, "learning_rate": 4.8121067484960856e-06, "loss": 1.1648, "step": 4995 }, { "epoch": 0.15, "learning_rate": 4.8120139625460596e-06, "loss": 1.1292, "step": 4996 }, { "epoch": 0.15, "learning_rate": 4.8119211545867735e-06, "loss": 1.1588, "step": 4997 }, { "epoch": 0.15, "learning_rate": 4.811828324619112e-06, "loss": 1.1927, "step": 4998 }, { "epoch": 0.15, "learning_rate": 4.811735472643958e-06, "loss": 1.1909, "step": 4999 }, { "epoch": 0.15, "learning_rate": 4.8116425986621955e-06, "loss": 1.0789, "step": 5000 }, { "epoch": 0.15, "learning_rate": 4.811549702674708e-06, "loss": 1.1527, "step": 5001 }, { "epoch": 0.15, "learning_rate": 4.811456784682381e-06, "loss": 1.1495, "step": 5002 }, { "epoch": 0.15, "learning_rate": 4.8113638446861e-06, "loss": 1.1155, "step": 5003 }, { "epoch": 0.15, "learning_rate": 4.811270882686747e-06, "loss": 1.1055, "step": 5004 }, { "epoch": 0.15, "learning_rate": 4.811177898685209e-06, "loss": 1.1334, "step": 5005 }, { "epoch": 0.15, "learning_rate": 4.81108489268237e-06, "loss": 1.2993, "step": 5006 }, { "epoch": 0.15, "learning_rate": 4.810991864679116e-06, "loss": 1.1677, "step": 5007 }, { "epoch": 0.15, "learning_rate": 4.810898814676332e-06, "loss": 1.1292, "step": 5008 }, { "epoch": 0.15, "learning_rate": 4.810805742674905e-06, "loss": 1.1346, "step": 5009 }, { "epoch": 0.15, "learning_rate": 4.81071264867572e-06, "loss": 1.1223, "step": 5010 }, { "epoch": 0.15, "learning_rate": 4.810619532679665e-06, "loss": 1.0984, "step": 5011 }, { "epoch": 0.15, "learning_rate": 4.810526394687623e-06, "loss": 1.1603, "step": 5012 }, { "epoch": 0.15, "learning_rate": 4.8104332347004825e-06, "loss": 1.0208, "step": 5013 }, { "epoch": 0.15, "learning_rate": 4.8103400527191305e-06, "loss": 1.0662, "step": 5014 }, { "epoch": 0.15, "learning_rate": 4.8102468487444545e-06, "loss": 1.1199, "step": 5015 }, { "epoch": 0.15, "learning_rate": 4.810153622777341e-06, "loss": 1.2205, "step": 5016 }, { "epoch": 0.15, "learning_rate": 4.810060374818677e-06, "loss": 1.214, "step": 5017 }, { "epoch": 0.15, "learning_rate": 4.809967104869352e-06, "loss": 1.0439, "step": 5018 }, { "epoch": 0.15, "learning_rate": 4.809873812930251e-06, "loss": 1.0739, "step": 5019 }, { "epoch": 0.15, "learning_rate": 4.809780499002265e-06, "loss": 1.0901, "step": 5020 }, { "epoch": 0.15, "learning_rate": 4.8096871630862805e-06, "loss": 1.0663, "step": 5021 }, { "epoch": 0.15, "learning_rate": 4.809593805183188e-06, "loss": 1.2134, "step": 5022 }, { "epoch": 0.15, "learning_rate": 4.8095004252938734e-06, "loss": 1.2107, "step": 5023 }, { "epoch": 0.15, "learning_rate": 4.809407023419227e-06, "loss": 1.2422, "step": 5024 }, { "epoch": 0.15, "learning_rate": 4.809313599560138e-06, "loss": 1.1893, "step": 5025 }, { "epoch": 0.15, "learning_rate": 4.809220153717496e-06, "loss": 1.1165, "step": 5026 }, { "epoch": 0.15, "learning_rate": 4.809126685892191e-06, "loss": 1.2026, "step": 5027 }, { "epoch": 0.15, "learning_rate": 4.809033196085111e-06, "loss": 1.2147, "step": 5028 }, { "epoch": 0.15, "learning_rate": 4.808939684297148e-06, "loss": 1.1351, "step": 5029 }, { "epoch": 0.15, "learning_rate": 4.808846150529191e-06, "loss": 1.1105, "step": 5030 }, { "epoch": 0.15, "learning_rate": 4.808752594782129e-06, "loss": 1.4191, "step": 5031 }, { "epoch": 0.15, "learning_rate": 4.8086590170568555e-06, "loss": 1.1785, "step": 5032 }, { "epoch": 0.15, "learning_rate": 4.808565417354261e-06, "loss": 1.1122, "step": 5033 }, { "epoch": 0.15, "learning_rate": 4.808471795675234e-06, "loss": 1.0389, "step": 5034 }, { "epoch": 0.15, "learning_rate": 4.808378152020668e-06, "loss": 1.1638, "step": 5035 }, { "epoch": 0.15, "learning_rate": 4.808284486391454e-06, "loss": 1.1989, "step": 5036 }, { "epoch": 0.15, "learning_rate": 4.808190798788483e-06, "loss": 1.1152, "step": 5037 }, { "epoch": 0.15, "learning_rate": 4.808097089212648e-06, "loss": 1.224, "step": 5038 }, { "epoch": 0.15, "learning_rate": 4.808003357664839e-06, "loss": 1.1389, "step": 5039 }, { "epoch": 0.15, "learning_rate": 4.80790960414595e-06, "loss": 1.1191, "step": 5040 }, { "epoch": 0.15, "learning_rate": 4.807815828656874e-06, "loss": 1.1243, "step": 5041 }, { "epoch": 0.15, "learning_rate": 4.807722031198503e-06, "loss": 1.1681, "step": 5042 }, { "epoch": 0.15, "learning_rate": 4.807628211771728e-06, "loss": 1.2104, "step": 5043 }, { "epoch": 0.15, "learning_rate": 4.807534370377445e-06, "loss": 1.1375, "step": 5044 }, { "epoch": 0.15, "learning_rate": 4.8074405070165455e-06, "loss": 1.1595, "step": 5045 }, { "epoch": 0.15, "learning_rate": 4.807346621689925e-06, "loss": 1.0242, "step": 5046 }, { "epoch": 0.15, "learning_rate": 4.807252714398474e-06, "loss": 1.0185, "step": 5047 }, { "epoch": 0.15, "learning_rate": 4.807158785143089e-06, "loss": 1.1443, "step": 5048 }, { "epoch": 0.15, "learning_rate": 4.807064833924664e-06, "loss": 1.2345, "step": 5049 }, { "epoch": 0.15, "learning_rate": 4.806970860744093e-06, "loss": 1.147, "step": 5050 }, { "epoch": 0.15, "learning_rate": 4.80687686560227e-06, "loss": 1.2158, "step": 5051 }, { "epoch": 0.15, "learning_rate": 4.806782848500091e-06, "loss": 1.1522, "step": 5052 }, { "epoch": 0.15, "learning_rate": 4.806688809438449e-06, "loss": 1.136, "step": 5053 }, { "epoch": 0.15, "learning_rate": 4.806594748418242e-06, "loss": 1.262, "step": 5054 }, { "epoch": 0.15, "learning_rate": 4.806500665440363e-06, "loss": 1.2354, "step": 5055 }, { "epoch": 0.15, "learning_rate": 4.806406560505709e-06, "loss": 1.2668, "step": 5056 }, { "epoch": 0.15, "learning_rate": 4.806312433615174e-06, "loss": 1.2189, "step": 5057 }, { "epoch": 0.15, "learning_rate": 4.806218284769657e-06, "loss": 1.1194, "step": 5058 }, { "epoch": 0.15, "learning_rate": 4.806124113970052e-06, "loss": 1.1742, "step": 5059 }, { "epoch": 0.15, "learning_rate": 4.806029921217255e-06, "loss": 1.0375, "step": 5060 }, { "epoch": 0.15, "learning_rate": 4.805935706512166e-06, "loss": 1.1276, "step": 5061 }, { "epoch": 0.15, "learning_rate": 4.805841469855679e-06, "loss": 1.1486, "step": 5062 }, { "epoch": 0.15, "learning_rate": 4.80574721124869e-06, "loss": 1.1151, "step": 5063 }, { "epoch": 0.15, "learning_rate": 4.805652930692099e-06, "loss": 1.1364, "step": 5064 }, { "epoch": 0.15, "learning_rate": 4.805558628186804e-06, "loss": 1.1827, "step": 5065 }, { "epoch": 0.15, "learning_rate": 4.8054643037337e-06, "loss": 1.1951, "step": 5066 }, { "epoch": 0.15, "learning_rate": 4.805369957333687e-06, "loss": 1.222, "step": 5067 }, { "epoch": 0.15, "learning_rate": 4.805275588987661e-06, "loss": 1.3074, "step": 5068 }, { "epoch": 0.15, "learning_rate": 4.805181198696523e-06, "loss": 1.1169, "step": 5069 }, { "epoch": 0.15, "learning_rate": 4.805086786461168e-06, "loss": 1.0183, "step": 5070 }, { "epoch": 0.15, "learning_rate": 4.804992352282499e-06, "loss": 1.1468, "step": 5071 }, { "epoch": 0.15, "learning_rate": 4.804897896161413e-06, "loss": 1.1483, "step": 5072 }, { "epoch": 0.15, "learning_rate": 4.804803418098808e-06, "loss": 1.1509, "step": 5073 }, { "epoch": 0.15, "learning_rate": 4.804708918095585e-06, "loss": 1.2374, "step": 5074 }, { "epoch": 0.15, "learning_rate": 4.804614396152643e-06, "loss": 1.1105, "step": 5075 }, { "epoch": 0.15, "learning_rate": 4.804519852270881e-06, "loss": 1.144, "step": 5076 }, { "epoch": 0.15, "learning_rate": 4.8044252864512015e-06, "loss": 1.1907, "step": 5077 }, { "epoch": 0.15, "learning_rate": 4.804330698694503e-06, "loss": 1.1226, "step": 5078 }, { "epoch": 0.15, "learning_rate": 4.804236089001685e-06, "loss": 1.1998, "step": 5079 }, { "epoch": 0.15, "learning_rate": 4.804141457373649e-06, "loss": 1.1606, "step": 5080 }, { "epoch": 0.15, "learning_rate": 4.804046803811297e-06, "loss": 1.1799, "step": 5081 }, { "epoch": 0.15, "learning_rate": 4.803952128315529e-06, "loss": 1.1535, "step": 5082 }, { "epoch": 0.15, "learning_rate": 4.8038574308872465e-06, "loss": 1.1377, "step": 5083 }, { "epoch": 0.15, "learning_rate": 4.80376271152735e-06, "loss": 1.0872, "step": 5084 }, { "epoch": 0.15, "learning_rate": 4.803667970236743e-06, "loss": 1.1593, "step": 5085 }, { "epoch": 0.15, "learning_rate": 4.803573207016326e-06, "loss": 1.1462, "step": 5086 }, { "epoch": 0.15, "learning_rate": 4.803478421867001e-06, "loss": 1.2089, "step": 5087 }, { "epoch": 0.15, "learning_rate": 4.8033836147896716e-06, "loss": 1.108, "step": 5088 }, { "epoch": 0.15, "learning_rate": 4.803288785785239e-06, "loss": 1.1132, "step": 5089 }, { "epoch": 0.15, "learning_rate": 4.8031939348546065e-06, "loss": 1.087, "step": 5090 }, { "epoch": 0.15, "learning_rate": 4.803099061998677e-06, "loss": 1.2229, "step": 5091 }, { "epoch": 0.15, "learning_rate": 4.803004167218354e-06, "loss": 1.2051, "step": 5092 }, { "epoch": 0.15, "learning_rate": 4.80290925051454e-06, "loss": 1.1635, "step": 5093 }, { "epoch": 0.15, "learning_rate": 4.80281431188814e-06, "loss": 1.1368, "step": 5094 }, { "epoch": 0.15, "learning_rate": 4.802719351340056e-06, "loss": 1.1089, "step": 5095 }, { "epoch": 0.15, "learning_rate": 4.802624368871193e-06, "loss": 1.0936, "step": 5096 }, { "epoch": 0.15, "learning_rate": 4.802529364482454e-06, "loss": 1.0743, "step": 5097 }, { "epoch": 0.15, "learning_rate": 4.802434338174746e-06, "loss": 1.1782, "step": 5098 }, { "epoch": 0.15, "learning_rate": 4.802339289948972e-06, "loss": 1.1799, "step": 5099 }, { "epoch": 0.15, "learning_rate": 4.802244219806036e-06, "loss": 1.0917, "step": 5100 }, { "epoch": 0.15, "learning_rate": 4.8021491277468435e-06, "loss": 1.205, "step": 5101 }, { "epoch": 0.15, "learning_rate": 4.8020540137723e-06, "loss": 1.2088, "step": 5102 }, { "epoch": 0.15, "learning_rate": 4.801958877883312e-06, "loss": 1.1582, "step": 5103 }, { "epoch": 0.15, "learning_rate": 4.8018637200807835e-06, "loss": 1.2324, "step": 5104 }, { "epoch": 0.15, "learning_rate": 4.801768540365621e-06, "loss": 1.2178, "step": 5105 }, { "epoch": 0.15, "learning_rate": 4.801673338738732e-06, "loss": 1.209, "step": 5106 }, { "epoch": 0.15, "learning_rate": 4.801578115201019e-06, "loss": 1.1141, "step": 5107 }, { "epoch": 0.15, "learning_rate": 4.801482869753392e-06, "loss": 1.1453, "step": 5108 }, { "epoch": 0.15, "learning_rate": 4.801387602396756e-06, "loss": 1.166, "step": 5109 }, { "epoch": 0.15, "learning_rate": 4.801292313132019e-06, "loss": 1.0884, "step": 5110 }, { "epoch": 0.15, "learning_rate": 4.801197001960088e-06, "loss": 1.0355, "step": 5111 }, { "epoch": 0.15, "learning_rate": 4.801101668881869e-06, "loss": 1.1458, "step": 5112 }, { "epoch": 0.15, "learning_rate": 4.80100631389827e-06, "loss": 1.1725, "step": 5113 }, { "epoch": 0.15, "learning_rate": 4.8009109370102e-06, "loss": 1.1165, "step": 5114 }, { "epoch": 0.15, "learning_rate": 4.800815538218566e-06, "loss": 1.1827, "step": 5115 }, { "epoch": 0.15, "learning_rate": 4.800720117524276e-06, "loss": 1.1402, "step": 5116 }, { "epoch": 0.15, "learning_rate": 4.800624674928238e-06, "loss": 1.216, "step": 5117 }, { "epoch": 0.15, "learning_rate": 4.800529210431362e-06, "loss": 1.3055, "step": 5118 }, { "epoch": 0.15, "learning_rate": 4.8004337240345545e-06, "loss": 1.2327, "step": 5119 }, { "epoch": 0.15, "learning_rate": 4.800338215738727e-06, "loss": 1.1867, "step": 5120 }, { "epoch": 0.15, "learning_rate": 4.800242685544787e-06, "loss": 1.0835, "step": 5121 }, { "epoch": 0.15, "learning_rate": 4.800147133453645e-06, "loss": 1.1528, "step": 5122 }, { "epoch": 0.15, "learning_rate": 4.80005155946621e-06, "loss": 1.1261, "step": 5123 }, { "epoch": 0.15, "learning_rate": 4.799955963583392e-06, "loss": 1.3672, "step": 5124 }, { "epoch": 0.15, "learning_rate": 4.7998603458061e-06, "loss": 0.9269, "step": 5125 }, { "epoch": 0.15, "learning_rate": 4.799764706135246e-06, "loss": 1.2244, "step": 5126 }, { "epoch": 0.15, "learning_rate": 4.7996690445717395e-06, "loss": 1.1081, "step": 5127 }, { "epoch": 0.15, "learning_rate": 4.799573361116492e-06, "loss": 1.1327, "step": 5128 }, { "epoch": 0.15, "learning_rate": 4.799477655770412e-06, "loss": 1.1406, "step": 5129 }, { "epoch": 0.15, "learning_rate": 4.799381928534413e-06, "loss": 1.2645, "step": 5130 }, { "epoch": 0.15, "learning_rate": 4.799286179409406e-06, "loss": 1.1198, "step": 5131 }, { "epoch": 0.15, "learning_rate": 4.799190408396302e-06, "loss": 1.18, "step": 5132 }, { "epoch": 0.15, "learning_rate": 4.7990946154960115e-06, "loss": 1.187, "step": 5133 }, { "epoch": 0.15, "learning_rate": 4.798998800709448e-06, "loss": 1.1383, "step": 5134 }, { "epoch": 0.15, "learning_rate": 4.798902964037523e-06, "loss": 1.1651, "step": 5135 }, { "epoch": 0.15, "learning_rate": 4.798807105481149e-06, "loss": 1.223, "step": 5136 }, { "epoch": 0.15, "learning_rate": 4.798711225041239e-06, "loss": 1.2248, "step": 5137 }, { "epoch": 0.15, "learning_rate": 4.7986153227187045e-06, "loss": 1.1514, "step": 5138 }, { "epoch": 0.15, "learning_rate": 4.79851939851446e-06, "loss": 1.1865, "step": 5139 }, { "epoch": 0.15, "learning_rate": 4.798423452429417e-06, "loss": 1.1107, "step": 5140 }, { "epoch": 0.15, "learning_rate": 4.798327484464491e-06, "loss": 1.3209, "step": 5141 }, { "epoch": 0.15, "learning_rate": 4.798231494620593e-06, "loss": 1.2887, "step": 5142 }, { "epoch": 0.15, "learning_rate": 4.798135482898639e-06, "loss": 1.1479, "step": 5143 }, { "epoch": 0.15, "learning_rate": 4.79803944929954e-06, "loss": 1.2063, "step": 5144 }, { "epoch": 0.15, "learning_rate": 4.797943393824215e-06, "loss": 1.1616, "step": 5145 }, { "epoch": 0.16, "learning_rate": 4.797847316473574e-06, "loss": 1.1306, "step": 5146 }, { "epoch": 0.16, "learning_rate": 4.797751217248534e-06, "loss": 1.0566, "step": 5147 }, { "epoch": 0.16, "learning_rate": 4.797655096150008e-06, "loss": 1.2606, "step": 5148 }, { "epoch": 0.16, "learning_rate": 4.797558953178913e-06, "loss": 1.1158, "step": 5149 }, { "epoch": 0.16, "learning_rate": 4.797462788336163e-06, "loss": 1.0999, "step": 5150 }, { "epoch": 0.16, "learning_rate": 4.797366601622674e-06, "loss": 1.2336, "step": 5151 }, { "epoch": 0.16, "learning_rate": 4.79727039303936e-06, "loss": 1.16, "step": 5152 }, { "epoch": 0.16, "learning_rate": 4.79717416258714e-06, "loss": 1.1582, "step": 5153 }, { "epoch": 0.16, "learning_rate": 4.797077910266928e-06, "loss": 1.2222, "step": 5154 }, { "epoch": 0.16, "learning_rate": 4.7969816360796404e-06, "loss": 1.2292, "step": 5155 }, { "epoch": 0.16, "learning_rate": 4.796885340026194e-06, "loss": 1.1233, "step": 5156 }, { "epoch": 0.16, "learning_rate": 4.796789022107505e-06, "loss": 1.1117, "step": 5157 }, { "epoch": 0.16, "learning_rate": 4.796692682324491e-06, "loss": 1.0991, "step": 5158 }, { "epoch": 0.16, "learning_rate": 4.796596320678069e-06, "loss": 1.0634, "step": 5159 }, { "epoch": 0.16, "learning_rate": 4.796499937169156e-06, "loss": 1.1321, "step": 5160 }, { "epoch": 0.16, "learning_rate": 4.796403531798669e-06, "loss": 1.087, "step": 5161 }, { "epoch": 0.16, "learning_rate": 4.796307104567526e-06, "loss": 1.2208, "step": 5162 }, { "epoch": 0.16, "learning_rate": 4.796210655476646e-06, "loss": 1.1945, "step": 5163 }, { "epoch": 0.16, "learning_rate": 4.796114184526946e-06, "loss": 1.1485, "step": 5164 }, { "epoch": 0.16, "learning_rate": 4.796017691719346e-06, "loss": 1.1069, "step": 5165 }, { "epoch": 0.16, "learning_rate": 4.795921177054763e-06, "loss": 1.0988, "step": 5166 }, { "epoch": 0.16, "learning_rate": 4.795824640534116e-06, "loss": 1.1996, "step": 5167 }, { "epoch": 0.16, "learning_rate": 4.795728082158324e-06, "loss": 1.2009, "step": 5168 }, { "epoch": 0.16, "learning_rate": 4.795631501928306e-06, "loss": 1.1311, "step": 5169 }, { "epoch": 0.16, "learning_rate": 4.795534899844983e-06, "loss": 1.2148, "step": 5170 }, { "epoch": 0.16, "learning_rate": 4.795438275909272e-06, "loss": 1.1984, "step": 5171 }, { "epoch": 0.16, "learning_rate": 4.795341630122094e-06, "loss": 1.1733, "step": 5172 }, { "epoch": 0.16, "learning_rate": 4.79524496248437e-06, "loss": 1.1032, "step": 5173 }, { "epoch": 0.16, "learning_rate": 4.795148272997019e-06, "loss": 1.222, "step": 5174 }, { "epoch": 0.16, "learning_rate": 4.795051561660962e-06, "loss": 1.2019, "step": 5175 }, { "epoch": 0.16, "learning_rate": 4.794954828477118e-06, "loss": 1.2465, "step": 5176 }, { "epoch": 0.16, "learning_rate": 4.794858073446411e-06, "loss": 1.1713, "step": 5177 }, { "epoch": 0.16, "learning_rate": 4.7947612965697605e-06, "loss": 1.108, "step": 5178 }, { "epoch": 0.16, "learning_rate": 4.794664497848087e-06, "loss": 1.319, "step": 5179 }, { "epoch": 0.16, "learning_rate": 4.794567677282312e-06, "loss": 1.2516, "step": 5180 }, { "epoch": 0.16, "learning_rate": 4.794470834873359e-06, "loss": 1.1625, "step": 5181 }, { "epoch": 0.16, "learning_rate": 4.794373970622149e-06, "loss": 1.0878, "step": 5182 }, { "epoch": 0.16, "learning_rate": 4.7942770845296026e-06, "loss": 1.1326, "step": 5183 }, { "epoch": 0.16, "learning_rate": 4.794180176596645e-06, "loss": 1.1215, "step": 5184 }, { "epoch": 0.16, "learning_rate": 4.794083246824195e-06, "loss": 1.1087, "step": 5185 }, { "epoch": 0.16, "learning_rate": 4.793986295213178e-06, "loss": 1.1684, "step": 5186 }, { "epoch": 0.16, "learning_rate": 4.793889321764516e-06, "loss": 1.1422, "step": 5187 }, { "epoch": 0.16, "learning_rate": 4.7937923264791336e-06, "loss": 1.0951, "step": 5188 }, { "epoch": 0.16, "learning_rate": 4.793695309357952e-06, "loss": 1.2001, "step": 5189 }, { "epoch": 0.16, "learning_rate": 4.793598270401896e-06, "loss": 1.0921, "step": 5190 }, { "epoch": 0.16, "learning_rate": 4.793501209611889e-06, "loss": 1.1958, "step": 5191 }, { "epoch": 0.16, "learning_rate": 4.7934041269888556e-06, "loss": 1.0997, "step": 5192 }, { "epoch": 0.16, "learning_rate": 4.7933070225337195e-06, "loss": 1.2867, "step": 5193 }, { "epoch": 0.16, "learning_rate": 4.793209896247404e-06, "loss": 1.2368, "step": 5194 }, { "epoch": 0.16, "learning_rate": 4.793112748130836e-06, "loss": 1.1237, "step": 5195 }, { "epoch": 0.16, "learning_rate": 4.793015578184939e-06, "loss": 1.1047, "step": 5196 }, { "epoch": 0.16, "learning_rate": 4.792918386410636e-06, "loss": 1.1479, "step": 5197 }, { "epoch": 0.16, "learning_rate": 4.7928211728088566e-06, "loss": 1.1693, "step": 5198 }, { "epoch": 0.16, "learning_rate": 4.7927239373805225e-06, "loss": 1.207, "step": 5199 }, { "epoch": 0.16, "learning_rate": 4.792626680126562e-06, "loss": 1.0853, "step": 5200 }, { "epoch": 0.16, "learning_rate": 4.7925294010478985e-06, "loss": 1.2275, "step": 5201 }, { "epoch": 0.16, "learning_rate": 4.79243210014546e-06, "loss": 1.1014, "step": 5202 }, { "epoch": 0.16, "learning_rate": 4.792334777420171e-06, "loss": 1.1152, "step": 5203 }, { "epoch": 0.16, "learning_rate": 4.79223743287296e-06, "loss": 1.0895, "step": 5204 }, { "epoch": 0.16, "learning_rate": 4.7921400665047525e-06, "loss": 1.1561, "step": 5205 }, { "epoch": 0.16, "learning_rate": 4.7920426783164744e-06, "loss": 1.0991, "step": 5206 }, { "epoch": 0.16, "learning_rate": 4.791945268309055e-06, "loss": 1.0561, "step": 5207 }, { "epoch": 0.16, "learning_rate": 4.791847836483419e-06, "loss": 1.0544, "step": 5208 }, { "epoch": 0.16, "learning_rate": 4.7917503828404975e-06, "loss": 1.0611, "step": 5209 }, { "epoch": 0.16, "learning_rate": 4.791652907381215e-06, "loss": 1.1123, "step": 5210 }, { "epoch": 0.16, "learning_rate": 4.791555410106501e-06, "loss": 1.2568, "step": 5211 }, { "epoch": 0.16, "learning_rate": 4.7914578910172825e-06, "loss": 1.1375, "step": 5212 }, { "epoch": 0.16, "learning_rate": 4.791360350114489e-06, "loss": 1.2201, "step": 5213 }, { "epoch": 0.16, "learning_rate": 4.791262787399048e-06, "loss": 1.1583, "step": 5214 }, { "epoch": 0.16, "learning_rate": 4.79116520287189e-06, "loss": 1.1538, "step": 5215 }, { "epoch": 0.16, "learning_rate": 4.791067596533941e-06, "loss": 1.1772, "step": 5216 }, { "epoch": 0.16, "learning_rate": 4.790969968386133e-06, "loss": 1.2493, "step": 5217 }, { "epoch": 0.16, "learning_rate": 4.790872318429394e-06, "loss": 1.244, "step": 5218 }, { "epoch": 0.16, "learning_rate": 4.790774646664654e-06, "loss": 1.2781, "step": 5219 }, { "epoch": 0.16, "learning_rate": 4.790676953092842e-06, "loss": 1.0705, "step": 5220 }, { "epoch": 0.16, "learning_rate": 4.790579237714889e-06, "loss": 1.1285, "step": 5221 }, { "epoch": 0.16, "learning_rate": 4.790481500531725e-06, "loss": 1.1677, "step": 5222 }, { "epoch": 0.16, "learning_rate": 4.790383741544281e-06, "loss": 1.2615, "step": 5223 }, { "epoch": 0.16, "learning_rate": 4.790285960753485e-06, "loss": 1.1738, "step": 5224 }, { "epoch": 0.16, "learning_rate": 4.790188158160271e-06, "loss": 1.2207, "step": 5225 }, { "epoch": 0.16, "learning_rate": 4.790090333765569e-06, "loss": 1.1785, "step": 5226 }, { "epoch": 0.16, "learning_rate": 4.789992487570309e-06, "loss": 1.2112, "step": 5227 }, { "epoch": 0.16, "learning_rate": 4.789894619575424e-06, "loss": 1.0961, "step": 5228 }, { "epoch": 0.16, "learning_rate": 4.789796729781845e-06, "loss": 1.1276, "step": 5229 }, { "epoch": 0.16, "learning_rate": 4.789698818190504e-06, "loss": 1.2294, "step": 5230 }, { "epoch": 0.16, "learning_rate": 4.789600884802333e-06, "loss": 1.225, "step": 5231 }, { "epoch": 0.16, "learning_rate": 4.789502929618264e-06, "loss": 1.1672, "step": 5232 }, { "epoch": 0.16, "learning_rate": 4.78940495263923e-06, "loss": 1.1528, "step": 5233 }, { "epoch": 0.16, "learning_rate": 4.789306953866163e-06, "loss": 1.137, "step": 5234 }, { "epoch": 0.16, "learning_rate": 4.789208933299997e-06, "loss": 1.0794, "step": 5235 }, { "epoch": 0.16, "learning_rate": 4.789110890941664e-06, "loss": 1.1237, "step": 5236 }, { "epoch": 0.16, "learning_rate": 4.789012826792099e-06, "loss": 1.1015, "step": 5237 }, { "epoch": 0.16, "learning_rate": 4.7889147408522326e-06, "loss": 1.1232, "step": 5238 }, { "epoch": 0.16, "learning_rate": 4.788816633123001e-06, "loss": 1.1031, "step": 5239 }, { "epoch": 0.16, "learning_rate": 4.788718503605338e-06, "loss": 1.1666, "step": 5240 }, { "epoch": 0.16, "learning_rate": 4.788620352300176e-06, "loss": 1.1739, "step": 5241 }, { "epoch": 0.16, "learning_rate": 4.7885221792084515e-06, "loss": 1.2026, "step": 5242 }, { "epoch": 0.16, "learning_rate": 4.788423984331098e-06, "loss": 1.2251, "step": 5243 }, { "epoch": 0.16, "learning_rate": 4.788325767669049e-06, "loss": 1.1105, "step": 5244 }, { "epoch": 0.16, "learning_rate": 4.788227529223242e-06, "loss": 1.1141, "step": 5245 }, { "epoch": 0.16, "learning_rate": 4.7881292689946105e-06, "loss": 1.1154, "step": 5246 }, { "epoch": 0.16, "learning_rate": 4.788030986984091e-06, "loss": 1.1874, "step": 5247 }, { "epoch": 0.16, "learning_rate": 4.787932683192617e-06, "loss": 1.2575, "step": 5248 }, { "epoch": 0.16, "learning_rate": 4.787834357621127e-06, "loss": 1.3188, "step": 5249 }, { "epoch": 0.16, "learning_rate": 4.787736010270556e-06, "loss": 1.2408, "step": 5250 }, { "epoch": 0.16, "learning_rate": 4.787637641141839e-06, "loss": 1.1522, "step": 5251 }, { "epoch": 0.16, "learning_rate": 4.787539250235914e-06, "loss": 1.0325, "step": 5252 }, { "epoch": 0.16, "learning_rate": 4.787440837553717e-06, "loss": 0.9888, "step": 5253 }, { "epoch": 0.16, "learning_rate": 4.7873424030961845e-06, "loss": 1.114, "step": 5254 }, { "epoch": 0.16, "learning_rate": 4.7872439468642544e-06, "loss": 1.2681, "step": 5255 }, { "epoch": 0.16, "learning_rate": 4.787145468858864e-06, "loss": 1.1019, "step": 5256 }, { "epoch": 0.16, "learning_rate": 4.78704696908095e-06, "loss": 1.2061, "step": 5257 }, { "epoch": 0.16, "learning_rate": 4.78694844753145e-06, "loss": 1.1344, "step": 5258 }, { "epoch": 0.16, "learning_rate": 4.786849904211301e-06, "loss": 1.1289, "step": 5259 }, { "epoch": 0.16, "learning_rate": 4.786751339121444e-06, "loss": 1.0967, "step": 5260 }, { "epoch": 0.16, "learning_rate": 4.786652752262815e-06, "loss": 1.1772, "step": 5261 }, { "epoch": 0.16, "learning_rate": 4.786554143636353e-06, "loss": 1.2552, "step": 5262 }, { "epoch": 0.16, "learning_rate": 4.7864555132429965e-06, "loss": 1.1265, "step": 5263 }, { "epoch": 0.16, "learning_rate": 4.786356861083686e-06, "loss": 1.1558, "step": 5264 }, { "epoch": 0.16, "learning_rate": 4.7862581871593585e-06, "loss": 1.2089, "step": 5265 }, { "epoch": 0.16, "learning_rate": 4.786159491470954e-06, "loss": 1.079, "step": 5266 }, { "epoch": 0.16, "learning_rate": 4.786060774019412e-06, "loss": 1.1916, "step": 5267 }, { "epoch": 0.16, "learning_rate": 4.785962034805674e-06, "loss": 1.1199, "step": 5268 }, { "epoch": 0.16, "learning_rate": 4.785863273830676e-06, "loss": 1.045, "step": 5269 }, { "epoch": 0.16, "learning_rate": 4.7857644910953615e-06, "loss": 1.1873, "step": 5270 }, { "epoch": 0.16, "learning_rate": 4.785665686600671e-06, "loss": 1.1522, "step": 5271 }, { "epoch": 0.16, "learning_rate": 4.785566860347543e-06, "loss": 1.1927, "step": 5272 }, { "epoch": 0.16, "learning_rate": 4.785468012336919e-06, "loss": 1.1454, "step": 5273 }, { "epoch": 0.16, "learning_rate": 4.785369142569741e-06, "loss": 1.0884, "step": 5274 }, { "epoch": 0.16, "learning_rate": 4.785270251046949e-06, "loss": 1.0565, "step": 5275 }, { "epoch": 0.16, "learning_rate": 4.785171337769485e-06, "loss": 1.1556, "step": 5276 }, { "epoch": 0.16, "learning_rate": 4.78507240273829e-06, "loss": 1.0682, "step": 5277 }, { "epoch": 0.16, "learning_rate": 4.784973445954306e-06, "loss": 1.1536, "step": 5278 }, { "epoch": 0.16, "learning_rate": 4.784874467418477e-06, "loss": 1.1824, "step": 5279 }, { "epoch": 0.16, "learning_rate": 4.784775467131741e-06, "loss": 1.2235, "step": 5280 }, { "epoch": 0.16, "learning_rate": 4.784676445095045e-06, "loss": 1.1268, "step": 5281 }, { "epoch": 0.16, "learning_rate": 4.784577401309329e-06, "loss": 1.1758, "step": 5282 }, { "epoch": 0.16, "learning_rate": 4.784478335775536e-06, "loss": 1.1127, "step": 5283 }, { "epoch": 0.16, "learning_rate": 4.784379248494609e-06, "loss": 1.1038, "step": 5284 }, { "epoch": 0.16, "learning_rate": 4.784280139467493e-06, "loss": 1.1663, "step": 5285 }, { "epoch": 0.16, "learning_rate": 4.78418100869513e-06, "loss": 1.1868, "step": 5286 }, { "epoch": 0.16, "learning_rate": 4.784081856178464e-06, "loss": 1.1778, "step": 5287 }, { "epoch": 0.16, "learning_rate": 4.783982681918438e-06, "loss": 1.0251, "step": 5288 }, { "epoch": 0.16, "learning_rate": 4.783883485915998e-06, "loss": 1.2044, "step": 5289 }, { "epoch": 0.16, "learning_rate": 4.783784268172086e-06, "loss": 1.08, "step": 5290 }, { "epoch": 0.16, "learning_rate": 4.7836850286876475e-06, "loss": 1.2081, "step": 5291 }, { "epoch": 0.16, "learning_rate": 4.7835857674636285e-06, "loss": 1.1421, "step": 5292 }, { "epoch": 0.16, "learning_rate": 4.783486484500972e-06, "loss": 1.2043, "step": 5293 }, { "epoch": 0.16, "learning_rate": 4.783387179800625e-06, "loss": 1.1685, "step": 5294 }, { "epoch": 0.16, "learning_rate": 4.783287853363531e-06, "loss": 1.1776, "step": 5295 }, { "epoch": 0.16, "learning_rate": 4.783188505190636e-06, "loss": 1.1613, "step": 5296 }, { "epoch": 0.16, "learning_rate": 4.783089135282887e-06, "loss": 1.0831, "step": 5297 }, { "epoch": 0.16, "learning_rate": 4.782989743641227e-06, "loss": 1.1448, "step": 5298 }, { "epoch": 0.16, "learning_rate": 4.782890330266606e-06, "loss": 1.1146, "step": 5299 }, { "epoch": 0.16, "learning_rate": 4.782790895159969e-06, "loss": 1.0209, "step": 5300 }, { "epoch": 0.16, "learning_rate": 4.782691438322261e-06, "loss": 1.0817, "step": 5301 }, { "epoch": 0.16, "learning_rate": 4.78259195975443e-06, "loss": 1.1447, "step": 5302 }, { "epoch": 0.16, "learning_rate": 4.782492459457423e-06, "loss": 1.1526, "step": 5303 }, { "epoch": 0.16, "learning_rate": 4.782392937432186e-06, "loss": 1.0887, "step": 5304 }, { "epoch": 0.16, "learning_rate": 4.782293393679669e-06, "loss": 1.1536, "step": 5305 }, { "epoch": 0.16, "learning_rate": 4.782193828200818e-06, "loss": 1.1808, "step": 5306 }, { "epoch": 0.16, "learning_rate": 4.782094240996581e-06, "loss": 1.2277, "step": 5307 }, { "epoch": 0.16, "learning_rate": 4.781994632067905e-06, "loss": 1.131, "step": 5308 }, { "epoch": 0.16, "learning_rate": 4.78189500141574e-06, "loss": 1.0908, "step": 5309 }, { "epoch": 0.16, "learning_rate": 4.781795349041033e-06, "loss": 1.1775, "step": 5310 }, { "epoch": 0.16, "learning_rate": 4.781695674944733e-06, "loss": 1.2023, "step": 5311 }, { "epoch": 0.16, "learning_rate": 4.781595979127789e-06, "loss": 1.2087, "step": 5312 }, { "epoch": 0.16, "learning_rate": 4.781496261591151e-06, "loss": 1.1953, "step": 5313 }, { "epoch": 0.16, "learning_rate": 4.781396522335768e-06, "loss": 1.12, "step": 5314 }, { "epoch": 0.16, "learning_rate": 4.781296761362587e-06, "loss": 1.0356, "step": 5315 }, { "epoch": 0.16, "learning_rate": 4.78119697867256e-06, "loss": 1.1041, "step": 5316 }, { "epoch": 0.16, "learning_rate": 4.781097174266637e-06, "loss": 1.1564, "step": 5317 }, { "epoch": 0.16, "learning_rate": 4.780997348145767e-06, "loss": 1.2321, "step": 5318 }, { "epoch": 0.16, "learning_rate": 4.780897500310902e-06, "loss": 1.1462, "step": 5319 }, { "epoch": 0.16, "learning_rate": 4.78079763076299e-06, "loss": 1.0704, "step": 5320 }, { "epoch": 0.16, "learning_rate": 4.780697739502984e-06, "loss": 1.0896, "step": 5321 }, { "epoch": 0.16, "learning_rate": 4.780597826531833e-06, "loss": 1.1222, "step": 5322 }, { "epoch": 0.16, "learning_rate": 4.78049789185049e-06, "loss": 1.1356, "step": 5323 }, { "epoch": 0.16, "learning_rate": 4.780397935459904e-06, "loss": 1.1606, "step": 5324 }, { "epoch": 0.16, "learning_rate": 4.780297957361029e-06, "loss": 1.178, "step": 5325 }, { "epoch": 0.16, "learning_rate": 4.7801979575548156e-06, "loss": 1.1563, "step": 5326 }, { "epoch": 0.16, "learning_rate": 4.780097936042216e-06, "loss": 1.1714, "step": 5327 }, { "epoch": 0.16, "learning_rate": 4.779997892824182e-06, "loss": 1.1, "step": 5328 }, { "epoch": 0.16, "learning_rate": 4.779897827901665e-06, "loss": 1.1573, "step": 5329 }, { "epoch": 0.16, "learning_rate": 4.77979774127562e-06, "loss": 1.1453, "step": 5330 }, { "epoch": 0.16, "learning_rate": 4.779697632946998e-06, "loss": 1.1511, "step": 5331 }, { "epoch": 0.16, "learning_rate": 4.779597502916753e-06, "loss": 1.1876, "step": 5332 }, { "epoch": 0.16, "learning_rate": 4.779497351185838e-06, "loss": 1.2491, "step": 5333 }, { "epoch": 0.16, "learning_rate": 4.779397177755205e-06, "loss": 1.1668, "step": 5334 }, { "epoch": 0.16, "learning_rate": 4.7792969826258095e-06, "loss": 1.1007, "step": 5335 }, { "epoch": 0.16, "learning_rate": 4.779196765798604e-06, "loss": 1.0799, "step": 5336 }, { "epoch": 0.16, "learning_rate": 4.779096527274542e-06, "loss": 1.1678, "step": 5337 }, { "epoch": 0.16, "learning_rate": 4.778996267054581e-06, "loss": 1.1607, "step": 5338 }, { "epoch": 0.16, "learning_rate": 4.778895985139672e-06, "loss": 1.0276, "step": 5339 }, { "epoch": 0.16, "learning_rate": 4.77879568153077e-06, "loss": 1.2162, "step": 5340 }, { "epoch": 0.16, "learning_rate": 4.778695356228832e-06, "loss": 1.1226, "step": 5341 }, { "epoch": 0.16, "learning_rate": 4.778595009234811e-06, "loss": 1.1016, "step": 5342 }, { "epoch": 0.16, "learning_rate": 4.778494640549663e-06, "loss": 1.1871, "step": 5343 }, { "epoch": 0.16, "learning_rate": 4.778394250174343e-06, "loss": 1.2682, "step": 5344 }, { "epoch": 0.16, "learning_rate": 4.778293838109807e-06, "loss": 1.1648, "step": 5345 }, { "epoch": 0.16, "learning_rate": 4.778193404357011e-06, "loss": 1.1085, "step": 5346 }, { "epoch": 0.16, "learning_rate": 4.778092948916912e-06, "loss": 1.152, "step": 5347 }, { "epoch": 0.16, "learning_rate": 4.777992471790465e-06, "loss": 1.2927, "step": 5348 }, { "epoch": 0.16, "learning_rate": 4.777891972978625e-06, "loss": 1.1566, "step": 5349 }, { "epoch": 0.16, "learning_rate": 4.777791452482352e-06, "loss": 1.151, "step": 5350 }, { "epoch": 0.16, "learning_rate": 4.777690910302601e-06, "loss": 1.2119, "step": 5351 }, { "epoch": 0.16, "learning_rate": 4.77759034644033e-06, "loss": 1.1797, "step": 5352 }, { "epoch": 0.16, "learning_rate": 4.777489760896496e-06, "loss": 1.1379, "step": 5353 }, { "epoch": 0.16, "learning_rate": 4.777389153672056e-06, "loss": 1.3248, "step": 5354 }, { "epoch": 0.16, "learning_rate": 4.777288524767968e-06, "loss": 1.2123, "step": 5355 }, { "epoch": 0.16, "learning_rate": 4.77718787418519e-06, "loss": 1.2628, "step": 5356 }, { "epoch": 0.16, "learning_rate": 4.77708720192468e-06, "loss": 1.1442, "step": 5357 }, { "epoch": 0.16, "learning_rate": 4.776986507987397e-06, "loss": 1.0754, "step": 5358 }, { "epoch": 0.16, "learning_rate": 4.776885792374298e-06, "loss": 1.1536, "step": 5359 }, { "epoch": 0.16, "learning_rate": 4.776785055086344e-06, "loss": 1.1243, "step": 5360 }, { "epoch": 0.16, "learning_rate": 4.776684296124493e-06, "loss": 1.2088, "step": 5361 }, { "epoch": 0.16, "learning_rate": 4.776583515489703e-06, "loss": 1.0699, "step": 5362 }, { "epoch": 0.16, "learning_rate": 4.776482713182935e-06, "loss": 1.0712, "step": 5363 }, { "epoch": 0.16, "learning_rate": 4.7763818892051475e-06, "loss": 1.0496, "step": 5364 }, { "epoch": 0.16, "learning_rate": 4.776281043557301e-06, "loss": 1.1468, "step": 5365 }, { "epoch": 0.16, "learning_rate": 4.776180176240356e-06, "loss": 1.1855, "step": 5366 }, { "epoch": 0.16, "learning_rate": 4.776079287255271e-06, "loss": 1.2054, "step": 5367 }, { "epoch": 0.16, "learning_rate": 4.775978376603008e-06, "loss": 1.0211, "step": 5368 }, { "epoch": 0.16, "learning_rate": 4.775877444284525e-06, "loss": 1.1472, "step": 5369 }, { "epoch": 0.16, "learning_rate": 4.7757764903007875e-06, "loss": 1.1555, "step": 5370 }, { "epoch": 0.16, "learning_rate": 4.775675514652753e-06, "loss": 1.1387, "step": 5371 }, { "epoch": 0.16, "learning_rate": 4.775574517341383e-06, "loss": 1.0247, "step": 5372 }, { "epoch": 0.16, "learning_rate": 4.775473498367641e-06, "loss": 1.2135, "step": 5373 }, { "epoch": 0.16, "learning_rate": 4.775372457732486e-06, "loss": 1.197, "step": 5374 }, { "epoch": 0.16, "learning_rate": 4.7752713954368805e-06, "loss": 1.1605, "step": 5375 }, { "epoch": 0.16, "learning_rate": 4.775170311481788e-06, "loss": 1.147, "step": 5376 }, { "epoch": 0.16, "learning_rate": 4.77506920586817e-06, "loss": 1.1115, "step": 5377 }, { "epoch": 0.16, "learning_rate": 4.7749680785969885e-06, "loss": 1.1384, "step": 5378 }, { "epoch": 0.16, "learning_rate": 4.7748669296692064e-06, "loss": 1.1132, "step": 5379 }, { "epoch": 0.16, "learning_rate": 4.774765759085788e-06, "loss": 1.1562, "step": 5380 }, { "epoch": 0.16, "learning_rate": 4.774664566847693e-06, "loss": 0.9844, "step": 5381 }, { "epoch": 0.16, "learning_rate": 4.7745633529558886e-06, "loss": 1.0771, "step": 5382 }, { "epoch": 0.16, "learning_rate": 4.774462117411336e-06, "loss": 1.1809, "step": 5383 }, { "epoch": 0.16, "learning_rate": 4.774360860214999e-06, "loss": 1.0482, "step": 5384 }, { "epoch": 0.16, "learning_rate": 4.774259581367843e-06, "loss": 1.1602, "step": 5385 }, { "epoch": 0.16, "learning_rate": 4.774158280870831e-06, "loss": 1.2123, "step": 5386 }, { "epoch": 0.16, "learning_rate": 4.774056958724926e-06, "loss": 1.0468, "step": 5387 }, { "epoch": 0.16, "learning_rate": 4.773955614931095e-06, "loss": 1.1891, "step": 5388 }, { "epoch": 0.16, "learning_rate": 4.773854249490302e-06, "loss": 1.187, "step": 5389 }, { "epoch": 0.16, "learning_rate": 4.7737528624035115e-06, "loss": 1.0966, "step": 5390 }, { "epoch": 0.16, "learning_rate": 4.773651453671688e-06, "loss": 1.106, "step": 5391 }, { "epoch": 0.16, "learning_rate": 4.773550023295799e-06, "loss": 1.19, "step": 5392 }, { "epoch": 0.16, "learning_rate": 4.773448571276808e-06, "loss": 1.1473, "step": 5393 }, { "epoch": 0.16, "learning_rate": 4.773347097615682e-06, "loss": 1.1584, "step": 5394 }, { "epoch": 0.16, "learning_rate": 4.773245602313386e-06, "loss": 1.1149, "step": 5395 }, { "epoch": 0.16, "learning_rate": 4.773144085370887e-06, "loss": 1.1511, "step": 5396 }, { "epoch": 0.16, "learning_rate": 4.773042546789151e-06, "loss": 1.2075, "step": 5397 }, { "epoch": 0.16, "learning_rate": 4.772940986569144e-06, "loss": 1.1573, "step": 5398 }, { "epoch": 0.16, "learning_rate": 4.772839404711834e-06, "loss": 1.1473, "step": 5399 }, { "epoch": 0.16, "learning_rate": 4.772737801218188e-06, "loss": 1.1362, "step": 5400 }, { "epoch": 0.16, "learning_rate": 4.772636176089172e-06, "loss": 1.2113, "step": 5401 }, { "epoch": 0.16, "learning_rate": 4.772534529325754e-06, "loss": 1.1597, "step": 5402 }, { "epoch": 0.16, "learning_rate": 4.7724328609289025e-06, "loss": 1.1023, "step": 5403 }, { "epoch": 0.16, "learning_rate": 4.772331170899585e-06, "loss": 1.1264, "step": 5404 }, { "epoch": 0.16, "learning_rate": 4.772229459238768e-06, "loss": 1.1823, "step": 5405 }, { "epoch": 0.16, "learning_rate": 4.772127725947422e-06, "loss": 1.1116, "step": 5406 }, { "epoch": 0.16, "learning_rate": 4.7720259710265135e-06, "loss": 1.2021, "step": 5407 }, { "epoch": 0.16, "learning_rate": 4.771924194477012e-06, "loss": 1.1749, "step": 5408 }, { "epoch": 0.16, "learning_rate": 4.771822396299886e-06, "loss": 1.1956, "step": 5409 }, { "epoch": 0.16, "learning_rate": 4.771720576496106e-06, "loss": 1.0889, "step": 5410 }, { "epoch": 0.16, "learning_rate": 4.7716187350666395e-06, "loss": 1.1818, "step": 5411 }, { "epoch": 0.16, "learning_rate": 4.7715168720124575e-06, "loss": 1.3383, "step": 5412 }, { "epoch": 0.16, "learning_rate": 4.771414987334528e-06, "loss": 1.2205, "step": 5413 }, { "epoch": 0.16, "learning_rate": 4.771313081033822e-06, "loss": 1.227, "step": 5414 }, { "epoch": 0.16, "learning_rate": 4.771211153111309e-06, "loss": 1.1069, "step": 5415 }, { "epoch": 0.16, "learning_rate": 4.7711092035679606e-06, "loss": 1.1944, "step": 5416 }, { "epoch": 0.16, "learning_rate": 4.771007232404746e-06, "loss": 1.0537, "step": 5417 }, { "epoch": 0.16, "learning_rate": 4.7709052396226365e-06, "loss": 1.2496, "step": 5418 }, { "epoch": 0.16, "learning_rate": 4.770803225222602e-06, "loss": 1.0325, "step": 5419 }, { "epoch": 0.16, "learning_rate": 4.7707011892056154e-06, "loss": 1.1899, "step": 5420 }, { "epoch": 0.16, "learning_rate": 4.770599131572646e-06, "loss": 1.0698, "step": 5421 }, { "epoch": 0.16, "learning_rate": 4.770497052324667e-06, "loss": 1.1249, "step": 5422 }, { "epoch": 0.16, "learning_rate": 4.77039495146265e-06, "loss": 1.1851, "step": 5423 }, { "epoch": 0.16, "learning_rate": 4.7702928289875664e-06, "loss": 1.2783, "step": 5424 }, { "epoch": 0.16, "learning_rate": 4.7701906849003886e-06, "loss": 1.1509, "step": 5425 }, { "epoch": 0.16, "learning_rate": 4.770088519202088e-06, "loss": 1.2329, "step": 5426 }, { "epoch": 0.16, "learning_rate": 4.769986331893639e-06, "loss": 1.1951, "step": 5427 }, { "epoch": 0.16, "learning_rate": 4.769884122976013e-06, "loss": 1.118, "step": 5428 }, { "epoch": 0.16, "learning_rate": 4.769781892450182e-06, "loss": 1.1973, "step": 5429 }, { "epoch": 0.16, "learning_rate": 4.769679640317123e-06, "loss": 1.2823, "step": 5430 }, { "epoch": 0.16, "learning_rate": 4.7695773665778055e-06, "loss": 1.0839, "step": 5431 }, { "epoch": 0.16, "learning_rate": 4.769475071233205e-06, "loss": 1.2162, "step": 5432 }, { "epoch": 0.16, "learning_rate": 4.769372754284294e-06, "loss": 1.1572, "step": 5433 }, { "epoch": 0.16, "learning_rate": 4.769270415732048e-06, "loss": 1.1249, "step": 5434 }, { "epoch": 0.16, "learning_rate": 4.769168055577441e-06, "loss": 1.1385, "step": 5435 }, { "epoch": 0.16, "learning_rate": 4.769065673821447e-06, "loss": 1.2587, "step": 5436 }, { "epoch": 0.16, "learning_rate": 4.768963270465039e-06, "loss": 1.3349, "step": 5437 }, { "epoch": 0.16, "learning_rate": 4.768860845509196e-06, "loss": 1.1644, "step": 5438 }, { "epoch": 0.16, "learning_rate": 4.768758398954888e-06, "loss": 1.1409, "step": 5439 }, { "epoch": 0.16, "learning_rate": 4.768655930803095e-06, "loss": 1.183, "step": 5440 }, { "epoch": 0.16, "learning_rate": 4.768553441054788e-06, "loss": 1.0802, "step": 5441 }, { "epoch": 0.16, "learning_rate": 4.768450929710946e-06, "loss": 1.1511, "step": 5442 }, { "epoch": 0.16, "learning_rate": 4.768348396772543e-06, "loss": 1.1215, "step": 5443 }, { "epoch": 0.16, "learning_rate": 4.768245842240556e-06, "loss": 1.2521, "step": 5444 }, { "epoch": 0.16, "learning_rate": 4.768143266115961e-06, "loss": 1.1791, "step": 5445 }, { "epoch": 0.16, "learning_rate": 4.768040668399735e-06, "loss": 1.1354, "step": 5446 }, { "epoch": 0.16, "learning_rate": 4.767938049092854e-06, "loss": 1.1523, "step": 5447 }, { "epoch": 0.16, "learning_rate": 4.767835408196295e-06, "loss": 1.0944, "step": 5448 }, { "epoch": 0.16, "learning_rate": 4.767732745711035e-06, "loss": 1.2213, "step": 5449 }, { "epoch": 0.16, "learning_rate": 4.767630061638051e-06, "loss": 1.2251, "step": 5450 }, { "epoch": 0.16, "learning_rate": 4.767527355978321e-06, "loss": 1.0949, "step": 5451 }, { "epoch": 0.16, "learning_rate": 4.767424628732823e-06, "loss": 1.1921, "step": 5452 }, { "epoch": 0.16, "learning_rate": 4.767321879902534e-06, "loss": 1.1176, "step": 5453 }, { "epoch": 0.16, "learning_rate": 4.767219109488434e-06, "loss": 1.1275, "step": 5454 }, { "epoch": 0.16, "learning_rate": 4.767116317491499e-06, "loss": 1.2115, "step": 5455 }, { "epoch": 0.16, "learning_rate": 4.767013503912709e-06, "loss": 1.2869, "step": 5456 }, { "epoch": 0.16, "learning_rate": 4.766910668753042e-06, "loss": 1.2646, "step": 5457 }, { "epoch": 0.16, "learning_rate": 4.766807812013478e-06, "loss": 1.1493, "step": 5458 }, { "epoch": 0.16, "learning_rate": 4.766704933694994e-06, "loss": 1.1353, "step": 5459 }, { "epoch": 0.16, "learning_rate": 4.766602033798572e-06, "loss": 1.2301, "step": 5460 }, { "epoch": 0.16, "learning_rate": 4.766499112325189e-06, "loss": 1.1783, "step": 5461 }, { "epoch": 0.16, "learning_rate": 4.766396169275827e-06, "loss": 1.1494, "step": 5462 }, { "epoch": 0.16, "learning_rate": 4.766293204651464e-06, "loss": 1.1046, "step": 5463 }, { "epoch": 0.16, "learning_rate": 4.766190218453082e-06, "loss": 1.1412, "step": 5464 }, { "epoch": 0.16, "learning_rate": 4.766087210681661e-06, "loss": 1.1451, "step": 5465 }, { "epoch": 0.16, "learning_rate": 4.76598418133818e-06, "loss": 1.1232, "step": 5466 }, { "epoch": 0.16, "learning_rate": 4.765881130423622e-06, "loss": 1.0959, "step": 5467 }, { "epoch": 0.16, "learning_rate": 4.765778057938966e-06, "loss": 1.1891, "step": 5468 }, { "epoch": 0.16, "learning_rate": 4.765674963885194e-06, "loss": 1.1757, "step": 5469 }, { "epoch": 0.16, "learning_rate": 4.7655718482632884e-06, "loss": 1.1753, "step": 5470 }, { "epoch": 0.16, "learning_rate": 4.76546871107423e-06, "loss": 1.0906, "step": 5471 }, { "epoch": 0.16, "learning_rate": 4.765365552319e-06, "loss": 1.0641, "step": 5472 }, { "epoch": 0.16, "learning_rate": 4.7652623719985814e-06, "loss": 1.0712, "step": 5473 }, { "epoch": 0.16, "learning_rate": 4.765159170113955e-06, "loss": 1.2418, "step": 5474 }, { "epoch": 0.16, "learning_rate": 4.7650559466661054e-06, "loss": 1.2037, "step": 5475 }, { "epoch": 0.16, "learning_rate": 4.764952701656014e-06, "loss": 1.1654, "step": 5476 }, { "epoch": 0.16, "learning_rate": 4.764849435084663e-06, "loss": 1.1675, "step": 5477 }, { "epoch": 0.17, "learning_rate": 4.764746146953036e-06, "loss": 1.0486, "step": 5478 }, { "epoch": 0.17, "learning_rate": 4.764642837262118e-06, "loss": 1.1371, "step": 5479 }, { "epoch": 0.17, "learning_rate": 4.76453950601289e-06, "loss": 1.1205, "step": 5480 }, { "epoch": 0.17, "learning_rate": 4.764436153206335e-06, "loss": 1.1147, "step": 5481 }, { "epoch": 0.17, "learning_rate": 4.76433277884344e-06, "loss": 1.163, "step": 5482 }, { "epoch": 0.17, "learning_rate": 4.764229382925187e-06, "loss": 1.1936, "step": 5483 }, { "epoch": 0.17, "learning_rate": 4.764125965452562e-06, "loss": 1.1791, "step": 5484 }, { "epoch": 0.17, "learning_rate": 4.764022526426547e-06, "loss": 1.0843, "step": 5485 }, { "epoch": 0.17, "learning_rate": 4.7639190658481284e-06, "loss": 1.2407, "step": 5486 }, { "epoch": 0.17, "learning_rate": 4.76381558371829e-06, "loss": 1.2131, "step": 5487 }, { "epoch": 0.17, "learning_rate": 4.763712080038018e-06, "loss": 1.171, "step": 5488 }, { "epoch": 0.17, "learning_rate": 4.763608554808298e-06, "loss": 1.1984, "step": 5489 }, { "epoch": 0.17, "learning_rate": 4.7635050080301135e-06, "loss": 0.9995, "step": 5490 }, { "epoch": 0.17, "learning_rate": 4.763401439704452e-06, "loss": 0.9451, "step": 5491 }, { "epoch": 0.17, "learning_rate": 4.763297849832299e-06, "loss": 1.239, "step": 5492 }, { "epoch": 0.17, "learning_rate": 4.7631942384146405e-06, "loss": 1.1317, "step": 5493 }, { "epoch": 0.17, "learning_rate": 4.763090605452462e-06, "loss": 1.1398, "step": 5494 }, { "epoch": 0.17, "learning_rate": 4.762986950946752e-06, "loss": 1.1049, "step": 5495 }, { "epoch": 0.17, "learning_rate": 4.762883274898495e-06, "loss": 1.1964, "step": 5496 }, { "epoch": 0.17, "learning_rate": 4.76277957730868e-06, "loss": 1.1031, "step": 5497 }, { "epoch": 0.17, "learning_rate": 4.762675858178293e-06, "loss": 1.0951, "step": 5498 }, { "epoch": 0.17, "learning_rate": 4.762572117508322e-06, "loss": 1.1815, "step": 5499 }, { "epoch": 0.17, "learning_rate": 4.762468355299753e-06, "loss": 1.1891, "step": 5500 }, { "epoch": 0.17, "learning_rate": 4.762364571553576e-06, "loss": 1.1494, "step": 5501 }, { "epoch": 0.17, "learning_rate": 4.762260766270777e-06, "loss": 1.0777, "step": 5502 }, { "epoch": 0.17, "learning_rate": 4.762156939452346e-06, "loss": 1.1251, "step": 5503 }, { "epoch": 0.17, "learning_rate": 4.7620530910992705e-06, "loss": 1.0833, "step": 5504 }, { "epoch": 0.17, "learning_rate": 4.761949221212538e-06, "loss": 1.2542, "step": 5505 }, { "epoch": 0.17, "learning_rate": 4.761845329793139e-06, "loss": 1.1104, "step": 5506 }, { "epoch": 0.17, "learning_rate": 4.761741416842061e-06, "loss": 1.1059, "step": 5507 }, { "epoch": 0.17, "learning_rate": 4.7616374823602944e-06, "loss": 1.1764, "step": 5508 }, { "epoch": 0.17, "learning_rate": 4.761533526348828e-06, "loss": 1.1451, "step": 5509 }, { "epoch": 0.17, "learning_rate": 4.761429548808653e-06, "loss": 1.0889, "step": 5510 }, { "epoch": 0.17, "learning_rate": 4.7613255497407564e-06, "loss": 1.1285, "step": 5511 }, { "epoch": 0.17, "learning_rate": 4.76122152914613e-06, "loss": 1.2294, "step": 5512 }, { "epoch": 0.17, "learning_rate": 4.761117487025764e-06, "loss": 1.0236, "step": 5513 }, { "epoch": 0.17, "learning_rate": 4.761013423380648e-06, "loss": 1.0816, "step": 5514 }, { "epoch": 0.17, "learning_rate": 4.760909338211773e-06, "loss": 1.2247, "step": 5515 }, { "epoch": 0.17, "learning_rate": 4.760805231520131e-06, "loss": 1.0948, "step": 5516 }, { "epoch": 0.17, "learning_rate": 4.760701103306711e-06, "loss": 1.1859, "step": 5517 }, { "epoch": 0.17, "learning_rate": 4.760596953572506e-06, "loss": 1.1523, "step": 5518 }, { "epoch": 0.17, "learning_rate": 4.760492782318506e-06, "loss": 1.222, "step": 5519 }, { "epoch": 0.17, "learning_rate": 4.7603885895457046e-06, "loss": 1.2451, "step": 5520 }, { "epoch": 0.17, "learning_rate": 4.760284375255091e-06, "loss": 1.1495, "step": 5521 }, { "epoch": 0.17, "learning_rate": 4.76018013944766e-06, "loss": 1.1998, "step": 5522 }, { "epoch": 0.17, "learning_rate": 4.760075882124402e-06, "loss": 1.1263, "step": 5523 }, { "epoch": 0.17, "learning_rate": 4.7599716032863104e-06, "loss": 1.1927, "step": 5524 }, { "epoch": 0.17, "learning_rate": 4.759867302934377e-06, "loss": 1.0515, "step": 5525 }, { "epoch": 0.17, "learning_rate": 4.759762981069596e-06, "loss": 1.1926, "step": 5526 }, { "epoch": 0.17, "learning_rate": 4.7596586376929595e-06, "loss": 1.1282, "step": 5527 }, { "epoch": 0.17, "learning_rate": 4.759554272805461e-06, "loss": 1.115, "step": 5528 }, { "epoch": 0.17, "learning_rate": 4.759449886408094e-06, "loss": 1.028, "step": 5529 }, { "epoch": 0.17, "learning_rate": 4.759345478501852e-06, "loss": 1.0951, "step": 5530 }, { "epoch": 0.17, "learning_rate": 4.759241049087729e-06, "loss": 1.1705, "step": 5531 }, { "epoch": 0.17, "learning_rate": 4.7591365981667205e-06, "loss": 1.1973, "step": 5532 }, { "epoch": 0.17, "learning_rate": 4.759032125739819e-06, "loss": 1.1824, "step": 5533 }, { "epoch": 0.17, "learning_rate": 4.758927631808019e-06, "loss": 1.1444, "step": 5534 }, { "epoch": 0.17, "learning_rate": 4.758823116372316e-06, "loss": 1.1345, "step": 5535 }, { "epoch": 0.17, "learning_rate": 4.758718579433705e-06, "loss": 1.2357, "step": 5536 }, { "epoch": 0.17, "learning_rate": 4.758614020993182e-06, "loss": 1.1138, "step": 5537 }, { "epoch": 0.17, "learning_rate": 4.758509441051741e-06, "loss": 1.0947, "step": 5538 }, { "epoch": 0.17, "learning_rate": 4.7584048396103765e-06, "loss": 1.16, "step": 5539 }, { "epoch": 0.17, "learning_rate": 4.758300216670087e-06, "loss": 1.1573, "step": 5540 }, { "epoch": 0.17, "learning_rate": 4.758195572231866e-06, "loss": 1.3029, "step": 5541 }, { "epoch": 0.17, "learning_rate": 4.7580909062967115e-06, "loss": 1.1651, "step": 5542 }, { "epoch": 0.17, "learning_rate": 4.757986218865619e-06, "loss": 1.2864, "step": 5543 }, { "epoch": 0.17, "learning_rate": 4.757881509939584e-06, "loss": 1.1047, "step": 5544 }, { "epoch": 0.17, "learning_rate": 4.757776779519607e-06, "loss": 1.1647, "step": 5545 }, { "epoch": 0.17, "learning_rate": 4.757672027606681e-06, "loss": 1.1021, "step": 5546 }, { "epoch": 0.17, "learning_rate": 4.757567254201804e-06, "loss": 1.1719, "step": 5547 }, { "epoch": 0.17, "learning_rate": 4.757462459305975e-06, "loss": 1.0784, "step": 5548 }, { "epoch": 0.17, "learning_rate": 4.75735764292019e-06, "loss": 1.1243, "step": 5549 }, { "epoch": 0.17, "learning_rate": 4.757252805045448e-06, "loss": 1.2317, "step": 5550 }, { "epoch": 0.17, "learning_rate": 4.757147945682746e-06, "loss": 1.1694, "step": 5551 }, { "epoch": 0.17, "learning_rate": 4.757043064833082e-06, "loss": 1.1854, "step": 5552 }, { "epoch": 0.17, "learning_rate": 4.756938162497457e-06, "loss": 1.1379, "step": 5553 }, { "epoch": 0.17, "learning_rate": 4.756833238676865e-06, "loss": 1.3041, "step": 5554 }, { "epoch": 0.17, "learning_rate": 4.75672829337231e-06, "loss": 1.2023, "step": 5555 }, { "epoch": 0.17, "learning_rate": 4.756623326584787e-06, "loss": 1.2273, "step": 5556 }, { "epoch": 0.17, "learning_rate": 4.756518338315297e-06, "loss": 1.2153, "step": 5557 }, { "epoch": 0.17, "learning_rate": 4.75641332856484e-06, "loss": 1.1773, "step": 5558 }, { "epoch": 0.17, "learning_rate": 4.756308297334414e-06, "loss": 1.0905, "step": 5559 }, { "epoch": 0.17, "learning_rate": 4.75620324462502e-06, "loss": 1.1643, "step": 5560 }, { "epoch": 0.17, "learning_rate": 4.756098170437658e-06, "loss": 1.0793, "step": 5561 }, { "epoch": 0.17, "learning_rate": 4.7559930747733275e-06, "loss": 1.2568, "step": 5562 }, { "epoch": 0.17, "learning_rate": 4.75588795763303e-06, "loss": 1.1686, "step": 5563 }, { "epoch": 0.17, "learning_rate": 4.755782819017765e-06, "loss": 1.1465, "step": 5564 }, { "epoch": 0.17, "learning_rate": 4.755677658928534e-06, "loss": 1.1726, "step": 5565 }, { "epoch": 0.17, "learning_rate": 4.755572477366338e-06, "loss": 1.1271, "step": 5566 }, { "epoch": 0.17, "learning_rate": 4.7554672743321785e-06, "loss": 1.1533, "step": 5567 }, { "epoch": 0.17, "learning_rate": 4.755362049827057e-06, "loss": 1.131, "step": 5568 }, { "epoch": 0.17, "learning_rate": 4.7552568038519755e-06, "loss": 1.1957, "step": 5569 }, { "epoch": 0.17, "learning_rate": 4.755151536407935e-06, "loss": 1.1061, "step": 5570 }, { "epoch": 0.17, "learning_rate": 4.755046247495937e-06, "loss": 1.019, "step": 5571 }, { "epoch": 0.17, "learning_rate": 4.754940937116986e-06, "loss": 1.1337, "step": 5572 }, { "epoch": 0.17, "learning_rate": 4.754835605272083e-06, "loss": 1.1583, "step": 5573 }, { "epoch": 0.17, "learning_rate": 4.75473025196223e-06, "loss": 1.148, "step": 5574 }, { "epoch": 0.17, "learning_rate": 4.754624877188433e-06, "loss": 1.1705, "step": 5575 }, { "epoch": 0.17, "learning_rate": 4.754519480951692e-06, "loss": 1.0773, "step": 5576 }, { "epoch": 0.17, "learning_rate": 4.754414063253011e-06, "loss": 1.2249, "step": 5577 }, { "epoch": 0.17, "learning_rate": 4.754308624093393e-06, "loss": 1.1351, "step": 5578 }, { "epoch": 0.17, "learning_rate": 4.7542031634738445e-06, "loss": 1.261, "step": 5579 }, { "epoch": 0.17, "learning_rate": 4.7540976813953665e-06, "loss": 1.0437, "step": 5580 }, { "epoch": 0.17, "learning_rate": 4.753992177858965e-06, "loss": 1.2554, "step": 5581 }, { "epoch": 0.17, "learning_rate": 4.753886652865642e-06, "loss": 1.1823, "step": 5582 }, { "epoch": 0.17, "learning_rate": 4.753781106416406e-06, "loss": 1.1661, "step": 5583 }, { "epoch": 0.17, "learning_rate": 4.753675538512257e-06, "loss": 1.1055, "step": 5584 }, { "epoch": 0.17, "learning_rate": 4.753569949154203e-06, "loss": 1.0463, "step": 5585 }, { "epoch": 0.17, "learning_rate": 4.753464338343249e-06, "loss": 1.334, "step": 5586 }, { "epoch": 0.17, "learning_rate": 4.7533587060803995e-06, "loss": 1.177, "step": 5587 }, { "epoch": 0.17, "learning_rate": 4.75325305236666e-06, "loss": 1.1965, "step": 5588 }, { "epoch": 0.17, "learning_rate": 4.753147377203037e-06, "loss": 1.2778, "step": 5589 }, { "epoch": 0.17, "learning_rate": 4.753041680590536e-06, "loss": 1.0715, "step": 5590 }, { "epoch": 0.17, "learning_rate": 4.752935962530163e-06, "loss": 1.1509, "step": 5591 }, { "epoch": 0.17, "learning_rate": 4.7528302230229255e-06, "loss": 1.0578, "step": 5592 }, { "epoch": 0.17, "learning_rate": 4.752724462069829e-06, "loss": 1.1758, "step": 5593 }, { "epoch": 0.17, "learning_rate": 4.75261867967188e-06, "loss": 1.101, "step": 5594 }, { "epoch": 0.17, "learning_rate": 4.752512875830086e-06, "loss": 1.2196, "step": 5595 }, { "epoch": 0.17, "learning_rate": 4.752407050545455e-06, "loss": 1.1905, "step": 5596 }, { "epoch": 0.17, "learning_rate": 4.752301203818993e-06, "loss": 1.0438, "step": 5597 }, { "epoch": 0.17, "learning_rate": 4.752195335651709e-06, "loss": 1.0852, "step": 5598 }, { "epoch": 0.17, "learning_rate": 4.75208944604461e-06, "loss": 1.0823, "step": 5599 }, { "epoch": 0.17, "learning_rate": 4.7519835349987045e-06, "loss": 1.1755, "step": 5600 }, { "epoch": 0.17, "learning_rate": 4.7518776025149995e-06, "loss": 1.1517, "step": 5601 }, { "epoch": 0.17, "learning_rate": 4.751771648594504e-06, "loss": 1.1878, "step": 5602 }, { "epoch": 0.17, "learning_rate": 4.751665673238227e-06, "loss": 1.1071, "step": 5603 }, { "epoch": 0.17, "learning_rate": 4.7515596764471786e-06, "loss": 1.26, "step": 5604 }, { "epoch": 0.17, "learning_rate": 4.751453658222364e-06, "loss": 1.1903, "step": 5605 }, { "epoch": 0.17, "learning_rate": 4.751347618564798e-06, "loss": 1.1828, "step": 5606 }, { "epoch": 0.17, "learning_rate": 4.751241557475485e-06, "loss": 1.1083, "step": 5607 }, { "epoch": 0.17, "learning_rate": 4.751135474955437e-06, "loss": 1.2148, "step": 5608 }, { "epoch": 0.17, "learning_rate": 4.751029371005663e-06, "loss": 1.1254, "step": 5609 }, { "epoch": 0.17, "learning_rate": 4.750923245627175e-06, "loss": 1.1856, "step": 5610 }, { "epoch": 0.17, "learning_rate": 4.75081709882098e-06, "loss": 1.2283, "step": 5611 }, { "epoch": 0.17, "learning_rate": 4.7507109305880905e-06, "loss": 1.0801, "step": 5612 }, { "epoch": 0.17, "learning_rate": 4.7506047409295176e-06, "loss": 1.1501, "step": 5613 }, { "epoch": 0.17, "learning_rate": 4.750498529846271e-06, "loss": 1.1226, "step": 5614 }, { "epoch": 0.17, "learning_rate": 4.750392297339363e-06, "loss": 1.1188, "step": 5615 }, { "epoch": 0.17, "learning_rate": 4.750286043409803e-06, "loss": 1.1716, "step": 5616 }, { "epoch": 0.17, "learning_rate": 4.750179768058605e-06, "loss": 1.2239, "step": 5617 }, { "epoch": 0.17, "learning_rate": 4.750073471286779e-06, "loss": 1.2557, "step": 5618 }, { "epoch": 0.17, "learning_rate": 4.749967153095337e-06, "loss": 1.1658, "step": 5619 }, { "epoch": 0.17, "learning_rate": 4.749860813485291e-06, "loss": 1.1968, "step": 5620 }, { "epoch": 0.17, "learning_rate": 4.749754452457654e-06, "loss": 1.0991, "step": 5621 }, { "epoch": 0.17, "learning_rate": 4.749648070013438e-06, "loss": 1.0633, "step": 5622 }, { "epoch": 0.17, "learning_rate": 4.749541666153655e-06, "loss": 1.0375, "step": 5623 }, { "epoch": 0.17, "learning_rate": 4.749435240879321e-06, "loss": 1.2314, "step": 5624 }, { "epoch": 0.17, "learning_rate": 4.749328794191444e-06, "loss": 1.2667, "step": 5625 }, { "epoch": 0.17, "learning_rate": 4.7492223260910426e-06, "loss": 1.2006, "step": 5626 }, { "epoch": 0.17, "learning_rate": 4.749115836579127e-06, "loss": 1.0361, "step": 5627 }, { "epoch": 0.17, "learning_rate": 4.749009325656712e-06, "loss": 1.0674, "step": 5628 }, { "epoch": 0.17, "learning_rate": 4.748902793324811e-06, "loss": 1.2126, "step": 5629 }, { "epoch": 0.17, "learning_rate": 4.748796239584438e-06, "loss": 1.2399, "step": 5630 }, { "epoch": 0.17, "learning_rate": 4.748689664436609e-06, "loss": 1.2193, "step": 5631 }, { "epoch": 0.17, "learning_rate": 4.748583067882337e-06, "loss": 1.1544, "step": 5632 }, { "epoch": 0.17, "learning_rate": 4.748476449922637e-06, "loss": 1.1277, "step": 5633 }, { "epoch": 0.17, "learning_rate": 4.748369810558524e-06, "loss": 1.0797, "step": 5634 }, { "epoch": 0.17, "learning_rate": 4.7482631497910135e-06, "loss": 1.1199, "step": 5635 }, { "epoch": 0.17, "learning_rate": 4.748156467621121e-06, "loss": 1.1504, "step": 5636 }, { "epoch": 0.17, "learning_rate": 4.748049764049861e-06, "loss": 1.2773, "step": 5637 }, { "epoch": 0.17, "learning_rate": 4.7479430390782504e-06, "loss": 1.0963, "step": 5638 }, { "epoch": 0.17, "learning_rate": 4.747836292707304e-06, "loss": 1.1708, "step": 5639 }, { "epoch": 0.17, "learning_rate": 4.74772952493804e-06, "loss": 1.1245, "step": 5640 }, { "epoch": 0.17, "learning_rate": 4.747622735771473e-06, "loss": 1.1228, "step": 5641 }, { "epoch": 0.17, "learning_rate": 4.747515925208619e-06, "loss": 1.2231, "step": 5642 }, { "epoch": 0.17, "learning_rate": 4.747409093250497e-06, "loss": 1.0825, "step": 5643 }, { "epoch": 0.17, "learning_rate": 4.747302239898122e-06, "loss": 1.2039, "step": 5644 }, { "epoch": 0.17, "learning_rate": 4.747195365152513e-06, "loss": 1.1577, "step": 5645 }, { "epoch": 0.17, "learning_rate": 4.747088469014685e-06, "loss": 1.1284, "step": 5646 }, { "epoch": 0.17, "learning_rate": 4.746981551485659e-06, "loss": 1.1266, "step": 5647 }, { "epoch": 0.17, "learning_rate": 4.746874612566449e-06, "loss": 1.2972, "step": 5648 }, { "epoch": 0.17, "learning_rate": 4.746767652258075e-06, "loss": 1.173, "step": 5649 }, { "epoch": 0.17, "learning_rate": 4.746660670561556e-06, "loss": 1.1385, "step": 5650 }, { "epoch": 0.17, "learning_rate": 4.746553667477909e-06, "loss": 1.0917, "step": 5651 }, { "epoch": 0.17, "learning_rate": 4.746446643008153e-06, "loss": 1.1332, "step": 5652 }, { "epoch": 0.17, "learning_rate": 4.746339597153306e-06, "loss": 1.0562, "step": 5653 }, { "epoch": 0.17, "learning_rate": 4.74623252991439e-06, "loss": 1.1658, "step": 5654 }, { "epoch": 0.17, "learning_rate": 4.746125441292421e-06, "loss": 1.0948, "step": 5655 }, { "epoch": 0.17, "learning_rate": 4.746018331288419e-06, "loss": 1.2433, "step": 5656 }, { "epoch": 0.17, "learning_rate": 4.745911199903405e-06, "loss": 1.1439, "step": 5657 }, { "epoch": 0.17, "learning_rate": 4.745804047138398e-06, "loss": 1.1919, "step": 5658 }, { "epoch": 0.17, "learning_rate": 4.745696872994417e-06, "loss": 1.0989, "step": 5659 }, { "epoch": 0.17, "learning_rate": 4.745589677472485e-06, "loss": 1.1573, "step": 5660 }, { "epoch": 0.17, "learning_rate": 4.745482460573619e-06, "loss": 1.0975, "step": 5661 }, { "epoch": 0.17, "learning_rate": 4.745375222298843e-06, "loss": 1.1874, "step": 5662 }, { "epoch": 0.17, "learning_rate": 4.745267962649176e-06, "loss": 1.2371, "step": 5663 }, { "epoch": 0.17, "learning_rate": 4.745160681625639e-06, "loss": 1.2135, "step": 5664 }, { "epoch": 0.17, "learning_rate": 4.745053379229253e-06, "loss": 1.0303, "step": 5665 }, { "epoch": 0.17, "learning_rate": 4.744946055461041e-06, "loss": 1.1893, "step": 5666 }, { "epoch": 0.17, "learning_rate": 4.744838710322024e-06, "loss": 1.1832, "step": 5667 }, { "epoch": 0.17, "learning_rate": 4.744731343813222e-06, "loss": 1.134, "step": 5668 }, { "epoch": 0.17, "learning_rate": 4.744623955935661e-06, "loss": 1.1515, "step": 5669 }, { "epoch": 0.17, "learning_rate": 4.7445165466903595e-06, "loss": 1.0977, "step": 5670 }, { "epoch": 0.17, "learning_rate": 4.7444091160783415e-06, "loss": 1.1093, "step": 5671 }, { "epoch": 0.17, "learning_rate": 4.74430166410063e-06, "loss": 1.1086, "step": 5672 }, { "epoch": 0.17, "learning_rate": 4.7441941907582475e-06, "loss": 1.113, "step": 5673 }, { "epoch": 0.17, "learning_rate": 4.744086696052217e-06, "loss": 1.1486, "step": 5674 }, { "epoch": 0.17, "learning_rate": 4.7439791799835626e-06, "loss": 1.1107, "step": 5675 }, { "epoch": 0.17, "learning_rate": 4.743871642553306e-06, "loss": 1.1326, "step": 5676 }, { "epoch": 0.17, "learning_rate": 4.743764083762473e-06, "loss": 1.186, "step": 5677 }, { "epoch": 0.17, "learning_rate": 4.743656503612087e-06, "loss": 1.1031, "step": 5678 }, { "epoch": 0.17, "learning_rate": 4.74354890210317e-06, "loss": 1.1702, "step": 5679 }, { "epoch": 0.17, "learning_rate": 4.743441279236749e-06, "loss": 1.2367, "step": 5680 }, { "epoch": 0.17, "learning_rate": 4.743333635013847e-06, "loss": 1.1442, "step": 5681 }, { "epoch": 0.17, "learning_rate": 4.7432259694354895e-06, "loss": 1.0792, "step": 5682 }, { "epoch": 0.17, "learning_rate": 4.743118282502703e-06, "loss": 1.2863, "step": 5683 }, { "epoch": 0.17, "learning_rate": 4.743010574216508e-06, "loss": 1.0743, "step": 5684 }, { "epoch": 0.17, "learning_rate": 4.742902844577934e-06, "loss": 1.2258, "step": 5685 }, { "epoch": 0.17, "learning_rate": 4.742795093588004e-06, "loss": 1.1952, "step": 5686 }, { "epoch": 0.17, "learning_rate": 4.742687321247746e-06, "loss": 1.1269, "step": 5687 }, { "epoch": 0.17, "learning_rate": 4.742579527558185e-06, "loss": 1.1504, "step": 5688 }, { "epoch": 0.17, "learning_rate": 4.742471712520346e-06, "loss": 1.1103, "step": 5689 }, { "epoch": 0.17, "learning_rate": 4.742363876135256e-06, "loss": 1.062, "step": 5690 }, { "epoch": 0.17, "learning_rate": 4.742256018403943e-06, "loss": 1.2657, "step": 5691 }, { "epoch": 0.17, "learning_rate": 4.7421481393274326e-06, "loss": 1.1396, "step": 5692 }, { "epoch": 0.17, "learning_rate": 4.742040238906751e-06, "loss": 1.1133, "step": 5693 }, { "epoch": 0.17, "learning_rate": 4.741932317142926e-06, "loss": 1.1678, "step": 5694 }, { "epoch": 0.17, "learning_rate": 4.741824374036986e-06, "loss": 1.1683, "step": 5695 }, { "epoch": 0.17, "learning_rate": 4.741716409589958e-06, "loss": 1.1197, "step": 5696 }, { "epoch": 0.17, "learning_rate": 4.741608423802868e-06, "loss": 1.1317, "step": 5697 }, { "epoch": 0.17, "learning_rate": 4.741500416676746e-06, "loss": 1.1918, "step": 5698 }, { "epoch": 0.17, "learning_rate": 4.74139238821262e-06, "loss": 1.2187, "step": 5699 }, { "epoch": 0.17, "learning_rate": 4.741284338411518e-06, "loss": 1.2037, "step": 5700 }, { "epoch": 0.17, "learning_rate": 4.7411762672744675e-06, "loss": 1.1311, "step": 5701 }, { "epoch": 0.17, "learning_rate": 4.7410681748024995e-06, "loss": 1.1329, "step": 5702 }, { "epoch": 0.17, "learning_rate": 4.740960060996641e-06, "loss": 1.0681, "step": 5703 }, { "epoch": 0.17, "learning_rate": 4.740851925857922e-06, "loss": 1.213, "step": 5704 }, { "epoch": 0.17, "learning_rate": 4.740743769387373e-06, "loss": 1.1732, "step": 5705 }, { "epoch": 0.17, "learning_rate": 4.7406355915860215e-06, "loss": 1.2332, "step": 5706 }, { "epoch": 0.17, "learning_rate": 4.740527392454898e-06, "loss": 1.1642, "step": 5707 }, { "epoch": 0.17, "learning_rate": 4.740419171995033e-06, "loss": 1.2925, "step": 5708 }, { "epoch": 0.17, "learning_rate": 4.740310930207458e-06, "loss": 1.1591, "step": 5709 }, { "epoch": 0.17, "learning_rate": 4.7402026670932e-06, "loss": 1.1331, "step": 5710 }, { "epoch": 0.17, "learning_rate": 4.740094382653292e-06, "loss": 1.0693, "step": 5711 }, { "epoch": 0.17, "learning_rate": 4.739986076888765e-06, "loss": 1.2311, "step": 5712 }, { "epoch": 0.17, "learning_rate": 4.739877749800648e-06, "loss": 1.2762, "step": 5713 }, { "epoch": 0.17, "learning_rate": 4.739769401389975e-06, "loss": 1.1754, "step": 5714 }, { "epoch": 0.17, "learning_rate": 4.7396610316577765e-06, "loss": 1.0999, "step": 5715 }, { "epoch": 0.17, "learning_rate": 4.739552640605082e-06, "loss": 1.1145, "step": 5716 }, { "epoch": 0.17, "learning_rate": 4.739444228232925e-06, "loss": 1.1238, "step": 5717 }, { "epoch": 0.17, "learning_rate": 4.739335794542339e-06, "loss": 1.165, "step": 5718 }, { "epoch": 0.17, "learning_rate": 4.739227339534354e-06, "loss": 1.2449, "step": 5719 }, { "epoch": 0.17, "learning_rate": 4.739118863210003e-06, "loss": 1.1027, "step": 5720 }, { "epoch": 0.17, "learning_rate": 4.739010365570318e-06, "loss": 1.1255, "step": 5721 }, { "epoch": 0.17, "learning_rate": 4.738901846616334e-06, "loss": 1.0936, "step": 5722 }, { "epoch": 0.17, "learning_rate": 4.738793306349082e-06, "loss": 1.1193, "step": 5723 }, { "epoch": 0.17, "learning_rate": 4.738684744769597e-06, "loss": 1.0358, "step": 5724 }, { "epoch": 0.17, "learning_rate": 4.73857616187891e-06, "loss": 1.1431, "step": 5725 }, { "epoch": 0.17, "learning_rate": 4.738467557678057e-06, "loss": 1.1904, "step": 5726 }, { "epoch": 0.17, "learning_rate": 4.738358932168071e-06, "loss": 1.146, "step": 5727 }, { "epoch": 0.17, "learning_rate": 4.738250285349985e-06, "loss": 1.2111, "step": 5728 }, { "epoch": 0.17, "learning_rate": 4.738141617224835e-06, "loss": 1.1447, "step": 5729 }, { "epoch": 0.17, "learning_rate": 4.7380329277936545e-06, "loss": 1.1174, "step": 5730 }, { "epoch": 0.17, "learning_rate": 4.737924217057479e-06, "loss": 1.261, "step": 5731 }, { "epoch": 0.17, "learning_rate": 4.737815485017342e-06, "loss": 1.1846, "step": 5732 }, { "epoch": 0.17, "learning_rate": 4.73770673167428e-06, "loss": 1.1707, "step": 5733 }, { "epoch": 0.17, "learning_rate": 4.737597957029327e-06, "loss": 1.1704, "step": 5734 }, { "epoch": 0.17, "learning_rate": 4.737489161083519e-06, "loss": 1.1062, "step": 5735 }, { "epoch": 0.17, "learning_rate": 4.737380343837893e-06, "loss": 1.1597, "step": 5736 }, { "epoch": 0.17, "learning_rate": 4.737271505293482e-06, "loss": 1.1838, "step": 5737 }, { "epoch": 0.17, "learning_rate": 4.7371626454513255e-06, "loss": 1.1434, "step": 5738 }, { "epoch": 0.17, "learning_rate": 4.737053764312457e-06, "loss": 1.25, "step": 5739 }, { "epoch": 0.17, "learning_rate": 4.736944861877914e-06, "loss": 1.1146, "step": 5740 }, { "epoch": 0.17, "learning_rate": 4.736835938148734e-06, "loss": 1.202, "step": 5741 }, { "epoch": 0.17, "learning_rate": 4.736726993125953e-06, "loss": 1.2382, "step": 5742 }, { "epoch": 0.17, "learning_rate": 4.736618026810608e-06, "loss": 1.1831, "step": 5743 }, { "epoch": 0.17, "learning_rate": 4.736509039203736e-06, "loss": 1.0616, "step": 5744 }, { "epoch": 0.17, "learning_rate": 4.736400030306376e-06, "loss": 1.1375, "step": 5745 }, { "epoch": 0.17, "learning_rate": 4.736291000119564e-06, "loss": 1.241, "step": 5746 }, { "epoch": 0.17, "learning_rate": 4.7361819486443395e-06, "loss": 0.999, "step": 5747 }, { "epoch": 0.17, "learning_rate": 4.736072875881739e-06, "loss": 1.087, "step": 5748 }, { "epoch": 0.17, "learning_rate": 4.735963781832802e-06, "loss": 1.2711, "step": 5749 }, { "epoch": 0.17, "learning_rate": 4.735854666498567e-06, "loss": 1.2129, "step": 5750 }, { "epoch": 0.17, "learning_rate": 4.735745529880073e-06, "loss": 1.1536, "step": 5751 }, { "epoch": 0.17, "learning_rate": 4.735636371978357e-06, "loss": 1.0687, "step": 5752 }, { "epoch": 0.17, "learning_rate": 4.73552719279446e-06, "loss": 1.0732, "step": 5753 }, { "epoch": 0.17, "learning_rate": 4.735417992329421e-06, "loss": 1.2078, "step": 5754 }, { "epoch": 0.17, "learning_rate": 4.735308770584279e-06, "loss": 1.1682, "step": 5755 }, { "epoch": 0.17, "learning_rate": 4.735199527560074e-06, "loss": 1.0764, "step": 5756 }, { "epoch": 0.17, "learning_rate": 4.735090263257847e-06, "loss": 1.1951, "step": 5757 }, { "epoch": 0.17, "learning_rate": 4.7349809776786355e-06, "loss": 1.2082, "step": 5758 }, { "epoch": 0.17, "learning_rate": 4.734871670823482e-06, "loss": 1.1208, "step": 5759 }, { "epoch": 0.17, "learning_rate": 4.734762342693428e-06, "loss": 1.1242, "step": 5760 }, { "epoch": 0.17, "learning_rate": 4.734652993289511e-06, "loss": 1.1287, "step": 5761 }, { "epoch": 0.17, "learning_rate": 4.734543622612774e-06, "loss": 1.3248, "step": 5762 }, { "epoch": 0.17, "learning_rate": 4.734434230664259e-06, "loss": 1.1852, "step": 5763 }, { "epoch": 0.17, "learning_rate": 4.734324817445005e-06, "loss": 1.1759, "step": 5764 }, { "epoch": 0.17, "learning_rate": 4.734215382956056e-06, "loss": 1.1897, "step": 5765 }, { "epoch": 0.17, "learning_rate": 4.7341059271984515e-06, "loss": 1.1834, "step": 5766 }, { "epoch": 0.17, "learning_rate": 4.733996450173235e-06, "loss": 1.1854, "step": 5767 }, { "epoch": 0.17, "learning_rate": 4.733886951881449e-06, "loss": 1.1725, "step": 5768 }, { "epoch": 0.17, "learning_rate": 4.733777432324134e-06, "loss": 1.1677, "step": 5769 }, { "epoch": 0.17, "learning_rate": 4.7336678915023335e-06, "loss": 1.1814, "step": 5770 }, { "epoch": 0.17, "learning_rate": 4.7335583294170915e-06, "loss": 1.1287, "step": 5771 }, { "epoch": 0.17, "learning_rate": 4.73344874606945e-06, "loss": 1.1235, "step": 5772 }, { "epoch": 0.17, "learning_rate": 4.733339141460451e-06, "loss": 1.1462, "step": 5773 }, { "epoch": 0.17, "learning_rate": 4.7332295155911395e-06, "loss": 1.1841, "step": 5774 }, { "epoch": 0.17, "learning_rate": 4.733119868462559e-06, "loss": 1.1931, "step": 5775 }, { "epoch": 0.17, "learning_rate": 4.733010200075752e-06, "loss": 1.0857, "step": 5776 }, { "epoch": 0.17, "learning_rate": 4.732900510431764e-06, "loss": 1.0972, "step": 5777 }, { "epoch": 0.17, "learning_rate": 4.732790799531638e-06, "loss": 1.1199, "step": 5778 }, { "epoch": 0.17, "learning_rate": 4.732681067376419e-06, "loss": 1.1638, "step": 5779 }, { "epoch": 0.17, "learning_rate": 4.732571313967152e-06, "loss": 1.1811, "step": 5780 }, { "epoch": 0.17, "learning_rate": 4.732461539304881e-06, "loss": 1.3009, "step": 5781 }, { "epoch": 0.17, "learning_rate": 4.732351743390652e-06, "loss": 1.0652, "step": 5782 }, { "epoch": 0.17, "learning_rate": 4.732241926225509e-06, "loss": 1.0646, "step": 5783 }, { "epoch": 0.17, "learning_rate": 4.732132087810498e-06, "loss": 1.2261, "step": 5784 }, { "epoch": 0.17, "learning_rate": 4.732022228146664e-06, "loss": 1.1785, "step": 5785 }, { "epoch": 0.17, "learning_rate": 4.7319123472350546e-06, "loss": 1.1472, "step": 5786 }, { "epoch": 0.17, "learning_rate": 4.731802445076714e-06, "loss": 1.0569, "step": 5787 }, { "epoch": 0.17, "learning_rate": 4.731692521672688e-06, "loss": 1.1716, "step": 5788 }, { "epoch": 0.17, "learning_rate": 4.731582577024026e-06, "loss": 1.2284, "step": 5789 }, { "epoch": 0.17, "learning_rate": 4.7314726111317714e-06, "loss": 1.0691, "step": 5790 }, { "epoch": 0.17, "learning_rate": 4.731362623996972e-06, "loss": 1.2162, "step": 5791 }, { "epoch": 0.17, "learning_rate": 4.731252615620675e-06, "loss": 1.3097, "step": 5792 }, { "epoch": 0.17, "learning_rate": 4.731142586003928e-06, "loss": 1.1086, "step": 5793 }, { "epoch": 0.17, "learning_rate": 4.731032535147779e-06, "loss": 1.0952, "step": 5794 }, { "epoch": 0.17, "learning_rate": 4.730922463053274e-06, "loss": 1.037, "step": 5795 }, { "epoch": 0.17, "learning_rate": 4.730812369721461e-06, "loss": 1.1378, "step": 5796 }, { "epoch": 0.17, "learning_rate": 4.73070225515339e-06, "loss": 1.2426, "step": 5797 }, { "epoch": 0.17, "learning_rate": 4.730592119350107e-06, "loss": 1.0581, "step": 5798 }, { "epoch": 0.17, "learning_rate": 4.730481962312662e-06, "loss": 1.1022, "step": 5799 }, { "epoch": 0.17, "learning_rate": 4.730371784042102e-06, "loss": 1.069, "step": 5800 }, { "epoch": 0.17, "learning_rate": 4.730261584539478e-06, "loss": 1.1367, "step": 5801 }, { "epoch": 0.17, "learning_rate": 4.730151363805836e-06, "loss": 1.1285, "step": 5802 }, { "epoch": 0.17, "learning_rate": 4.730041121842229e-06, "loss": 1.0363, "step": 5803 }, { "epoch": 0.17, "learning_rate": 4.729930858649703e-06, "loss": 1.2523, "step": 5804 }, { "epoch": 0.17, "learning_rate": 4.72982057422931e-06, "loss": 1.1599, "step": 5805 }, { "epoch": 0.17, "learning_rate": 4.7297102685821e-06, "loss": 1.1196, "step": 5806 }, { "epoch": 0.17, "learning_rate": 4.72959994170912e-06, "loss": 1.095, "step": 5807 }, { "epoch": 0.17, "learning_rate": 4.729489593611424e-06, "loss": 1.1554, "step": 5808 }, { "epoch": 0.17, "learning_rate": 4.7293792242900605e-06, "loss": 1.1395, "step": 5809 }, { "epoch": 0.18, "learning_rate": 4.72926883374608e-06, "loss": 1.2498, "step": 5810 }, { "epoch": 0.18, "learning_rate": 4.729158421980534e-06, "loss": 1.1956, "step": 5811 }, { "epoch": 0.18, "learning_rate": 4.729047988994473e-06, "loss": 1.0873, "step": 5812 }, { "epoch": 0.18, "learning_rate": 4.72893753478895e-06, "loss": 1.1592, "step": 5813 }, { "epoch": 0.18, "learning_rate": 4.728827059365014e-06, "loss": 1.1088, "step": 5814 }, { "epoch": 0.18, "learning_rate": 4.728716562723718e-06, "loss": 1.0882, "step": 5815 }, { "epoch": 0.18, "learning_rate": 4.728606044866114e-06, "loss": 1.0612, "step": 5816 }, { "epoch": 0.18, "learning_rate": 4.728495505793254e-06, "loss": 1.2762, "step": 5817 }, { "epoch": 0.18, "learning_rate": 4.72838494550619e-06, "loss": 1.1875, "step": 5818 }, { "epoch": 0.18, "learning_rate": 4.728274364005974e-06, "loss": 1.2311, "step": 5819 }, { "epoch": 0.18, "learning_rate": 4.72816376129366e-06, "loss": 1.1604, "step": 5820 }, { "epoch": 0.18, "learning_rate": 4.7280531373703e-06, "loss": 1.0126, "step": 5821 }, { "epoch": 0.18, "learning_rate": 4.727942492236947e-06, "loss": 1.0026, "step": 5822 }, { "epoch": 0.18, "learning_rate": 4.7278318258946536e-06, "loss": 1.1952, "step": 5823 }, { "epoch": 0.18, "learning_rate": 4.7277211383444755e-06, "loss": 1.0819, "step": 5824 }, { "epoch": 0.18, "learning_rate": 4.727610429587464e-06, "loss": 1.1707, "step": 5825 }, { "epoch": 0.18, "learning_rate": 4.727499699624675e-06, "loss": 1.1978, "step": 5826 }, { "epoch": 0.18, "learning_rate": 4.7273889484571614e-06, "loss": 1.1458, "step": 5827 }, { "epoch": 0.18, "learning_rate": 4.727278176085977e-06, "loss": 1.1665, "step": 5828 }, { "epoch": 0.18, "learning_rate": 4.727167382512178e-06, "loss": 1.1516, "step": 5829 }, { "epoch": 0.18, "learning_rate": 4.7270565677368176e-06, "loss": 1.1589, "step": 5830 }, { "epoch": 0.18, "learning_rate": 4.726945731760951e-06, "loss": 1.2101, "step": 5831 }, { "epoch": 0.18, "learning_rate": 4.726834874585635e-06, "loss": 1.2144, "step": 5832 }, { "epoch": 0.18, "learning_rate": 4.726723996211922e-06, "loss": 1.2242, "step": 5833 }, { "epoch": 0.18, "learning_rate": 4.72661309664087e-06, "loss": 1.0941, "step": 5834 }, { "epoch": 0.18, "learning_rate": 4.726502175873533e-06, "loss": 1.1106, "step": 5835 }, { "epoch": 0.18, "learning_rate": 4.726391233910967e-06, "loss": 1.1439, "step": 5836 }, { "epoch": 0.18, "learning_rate": 4.72628027075423e-06, "loss": 1.2582, "step": 5837 }, { "epoch": 0.18, "learning_rate": 4.726169286404376e-06, "loss": 1.2261, "step": 5838 }, { "epoch": 0.18, "learning_rate": 4.726058280862464e-06, "loss": 1.126, "step": 5839 }, { "epoch": 0.18, "learning_rate": 4.725947254129548e-06, "loss": 1.1648, "step": 5840 }, { "epoch": 0.18, "learning_rate": 4.725836206206686e-06, "loss": 1.1178, "step": 5841 }, { "epoch": 0.18, "learning_rate": 4.725725137094937e-06, "loss": 1.1511, "step": 5842 }, { "epoch": 0.18, "learning_rate": 4.725614046795355e-06, "loss": 1.194, "step": 5843 }, { "epoch": 0.18, "learning_rate": 4.725502935309e-06, "loss": 1.0922, "step": 5844 }, { "epoch": 0.18, "learning_rate": 4.725391802636928e-06, "loss": 1.2018, "step": 5845 }, { "epoch": 0.18, "learning_rate": 4.725280648780199e-06, "loss": 1.1652, "step": 5846 }, { "epoch": 0.18, "learning_rate": 4.7251694737398695e-06, "loss": 1.2025, "step": 5847 }, { "epoch": 0.18, "learning_rate": 4.7250582775169985e-06, "loss": 1.2555, "step": 5848 }, { "epoch": 0.18, "learning_rate": 4.724947060112644e-06, "loss": 1.1037, "step": 5849 }, { "epoch": 0.18, "learning_rate": 4.7248358215278645e-06, "loss": 1.1866, "step": 5850 }, { "epoch": 0.18, "learning_rate": 4.724724561763721e-06, "loss": 1.1566, "step": 5851 }, { "epoch": 0.18, "learning_rate": 4.72461328082127e-06, "loss": 1.0645, "step": 5852 }, { "epoch": 0.18, "learning_rate": 4.7245019787015716e-06, "loss": 1.1954, "step": 5853 }, { "epoch": 0.18, "learning_rate": 4.724390655405686e-06, "loss": 1.1046, "step": 5854 }, { "epoch": 0.18, "learning_rate": 4.724279310934673e-06, "loss": 1.1263, "step": 5855 }, { "epoch": 0.18, "learning_rate": 4.724167945289593e-06, "loss": 1.1925, "step": 5856 }, { "epoch": 0.18, "learning_rate": 4.724056558471504e-06, "loss": 1.1782, "step": 5857 }, { "epoch": 0.18, "learning_rate": 4.723945150481468e-06, "loss": 1.2637, "step": 5858 }, { "epoch": 0.18, "learning_rate": 4.7238337213205455e-06, "loss": 1.0854, "step": 5859 }, { "epoch": 0.18, "learning_rate": 4.723722270989797e-06, "loss": 1.1824, "step": 5860 }, { "epoch": 0.18, "learning_rate": 4.723610799490284e-06, "loss": 1.2516, "step": 5861 }, { "epoch": 0.18, "learning_rate": 4.723499306823066e-06, "loss": 1.1423, "step": 5862 }, { "epoch": 0.18, "learning_rate": 4.723387792989206e-06, "loss": 1.2233, "step": 5863 }, { "epoch": 0.18, "learning_rate": 4.723276257989765e-06, "loss": 1.2269, "step": 5864 }, { "epoch": 0.18, "learning_rate": 4.723164701825805e-06, "loss": 1.1316, "step": 5865 }, { "epoch": 0.18, "learning_rate": 4.723053124498388e-06, "loss": 0.9932, "step": 5866 }, { "epoch": 0.18, "learning_rate": 4.7229415260085756e-06, "loss": 1.1011, "step": 5867 }, { "epoch": 0.18, "learning_rate": 4.72282990635743e-06, "loss": 1.2937, "step": 5868 }, { "epoch": 0.18, "learning_rate": 4.722718265546015e-06, "loss": 1.1452, "step": 5869 }, { "epoch": 0.18, "learning_rate": 4.722606603575392e-06, "loss": 1.1683, "step": 5870 }, { "epoch": 0.18, "learning_rate": 4.722494920446625e-06, "loss": 1.1415, "step": 5871 }, { "epoch": 0.18, "learning_rate": 4.722383216160776e-06, "loss": 1.2638, "step": 5872 }, { "epoch": 0.18, "learning_rate": 4.72227149071891e-06, "loss": 1.2326, "step": 5873 }, { "epoch": 0.18, "learning_rate": 4.722159744122089e-06, "loss": 1.2415, "step": 5874 }, { "epoch": 0.18, "learning_rate": 4.722047976371378e-06, "loss": 1.0273, "step": 5875 }, { "epoch": 0.18, "learning_rate": 4.721936187467841e-06, "loss": 1.1956, "step": 5876 }, { "epoch": 0.18, "learning_rate": 4.721824377412541e-06, "loss": 1.142, "step": 5877 }, { "epoch": 0.18, "learning_rate": 4.721712546206543e-06, "loss": 1.1826, "step": 5878 }, { "epoch": 0.18, "learning_rate": 4.72160069385091e-06, "loss": 1.1519, "step": 5879 }, { "epoch": 0.18, "learning_rate": 4.72148882034671e-06, "loss": 1.2303, "step": 5880 }, { "epoch": 0.18, "learning_rate": 4.721376925695007e-06, "loss": 1.1583, "step": 5881 }, { "epoch": 0.18, "learning_rate": 4.721265009896865e-06, "loss": 1.1541, "step": 5882 }, { "epoch": 0.18, "learning_rate": 4.72115307295335e-06, "loss": 1.1366, "step": 5883 }, { "epoch": 0.18, "learning_rate": 4.721041114865526e-06, "loss": 1.0782, "step": 5884 }, { "epoch": 0.18, "learning_rate": 4.720929135634462e-06, "loss": 1.1221, "step": 5885 }, { "epoch": 0.18, "learning_rate": 4.7208171352612205e-06, "loss": 1.2039, "step": 5886 }, { "epoch": 0.18, "learning_rate": 4.720705113746871e-06, "loss": 1.1702, "step": 5887 }, { "epoch": 0.18, "learning_rate": 4.720593071092478e-06, "loss": 1.1021, "step": 5888 }, { "epoch": 0.18, "learning_rate": 4.720481007299109e-06, "loss": 1.1957, "step": 5889 }, { "epoch": 0.18, "learning_rate": 4.7203689223678294e-06, "loss": 1.1887, "step": 5890 }, { "epoch": 0.18, "learning_rate": 4.720256816299707e-06, "loss": 1.115, "step": 5891 }, { "epoch": 0.18, "learning_rate": 4.720144689095809e-06, "loss": 1.0497, "step": 5892 }, { "epoch": 0.18, "learning_rate": 4.720032540757203e-06, "loss": 1.1153, "step": 5893 }, { "epoch": 0.18, "learning_rate": 4.719920371284957e-06, "loss": 1.1725, "step": 5894 }, { "epoch": 0.18, "learning_rate": 4.7198081806801375e-06, "loss": 1.1414, "step": 5895 }, { "epoch": 0.18, "learning_rate": 4.719695968943813e-06, "loss": 1.1683, "step": 5896 }, { "epoch": 0.18, "learning_rate": 4.719583736077053e-06, "loss": 1.1725, "step": 5897 }, { "epoch": 0.18, "learning_rate": 4.719471482080924e-06, "loss": 1.2302, "step": 5898 }, { "epoch": 0.18, "learning_rate": 4.7193592069564956e-06, "loss": 1.2582, "step": 5899 }, { "epoch": 0.18, "learning_rate": 4.719246910704836e-06, "loss": 1.3387, "step": 5900 }, { "epoch": 0.18, "learning_rate": 4.719134593327015e-06, "loss": 1.1791, "step": 5901 }, { "epoch": 0.18, "learning_rate": 4.719022254824102e-06, "loss": 1.0442, "step": 5902 }, { "epoch": 0.18, "learning_rate": 4.7189098951971645e-06, "loss": 1.1228, "step": 5903 }, { "epoch": 0.18, "learning_rate": 4.718797514447275e-06, "loss": 1.1472, "step": 5904 }, { "epoch": 0.18, "learning_rate": 4.718685112575501e-06, "loss": 1.1407, "step": 5905 }, { "epoch": 0.18, "learning_rate": 4.718572689582913e-06, "loss": 1.1459, "step": 5906 }, { "epoch": 0.18, "learning_rate": 4.718460245470582e-06, "loss": 1.187, "step": 5907 }, { "epoch": 0.18, "learning_rate": 4.718347780239578e-06, "loss": 1.0871, "step": 5908 }, { "epoch": 0.18, "learning_rate": 4.718235293890971e-06, "loss": 1.1013, "step": 5909 }, { "epoch": 0.18, "learning_rate": 4.718122786425833e-06, "loss": 1.1567, "step": 5910 }, { "epoch": 0.18, "learning_rate": 4.718010257845234e-06, "loss": 1.088, "step": 5911 }, { "epoch": 0.18, "learning_rate": 4.717897708150245e-06, "loss": 1.2122, "step": 5912 }, { "epoch": 0.18, "learning_rate": 4.7177851373419385e-06, "loss": 1.174, "step": 5913 }, { "epoch": 0.18, "learning_rate": 4.717672545421386e-06, "loss": 1.2136, "step": 5914 }, { "epoch": 0.18, "learning_rate": 4.717559932389658e-06, "loss": 1.1838, "step": 5915 }, { "epoch": 0.18, "learning_rate": 4.7174472982478285e-06, "loss": 1.1885, "step": 5916 }, { "epoch": 0.18, "learning_rate": 4.717334642996968e-06, "loss": 1.1937, "step": 5917 }, { "epoch": 0.18, "learning_rate": 4.71722196663815e-06, "loss": 1.2341, "step": 5918 }, { "epoch": 0.18, "learning_rate": 4.717109269172446e-06, "loss": 1.1198, "step": 5919 }, { "epoch": 0.18, "learning_rate": 4.71699655060093e-06, "loss": 1.0998, "step": 5920 }, { "epoch": 0.18, "learning_rate": 4.716883810924675e-06, "loss": 1.0839, "step": 5921 }, { "epoch": 0.18, "learning_rate": 4.716771050144754e-06, "loss": 1.1141, "step": 5922 }, { "epoch": 0.18, "learning_rate": 4.71665826826224e-06, "loss": 1.1157, "step": 5923 }, { "epoch": 0.18, "learning_rate": 4.716545465278206e-06, "loss": 1.1772, "step": 5924 }, { "epoch": 0.18, "learning_rate": 4.716432641193728e-06, "loss": 1.1701, "step": 5925 }, { "epoch": 0.18, "learning_rate": 4.7163197960098775e-06, "loss": 1.0554, "step": 5926 }, { "epoch": 0.18, "learning_rate": 4.716206929727731e-06, "loss": 1.0982, "step": 5927 }, { "epoch": 0.18, "learning_rate": 4.716094042348362e-06, "loss": 1.1037, "step": 5928 }, { "epoch": 0.18, "learning_rate": 4.715981133872843e-06, "loss": 1.0888, "step": 5929 }, { "epoch": 0.18, "learning_rate": 4.715868204302253e-06, "loss": 1.1555, "step": 5930 }, { "epoch": 0.18, "learning_rate": 4.715755253637664e-06, "loss": 1.0562, "step": 5931 }, { "epoch": 0.18, "learning_rate": 4.7156422818801525e-06, "loss": 1.1284, "step": 5932 }, { "epoch": 0.18, "learning_rate": 4.715529289030793e-06, "loss": 1.1382, "step": 5933 }, { "epoch": 0.18, "learning_rate": 4.715416275090662e-06, "loss": 1.1376, "step": 5934 }, { "epoch": 0.18, "learning_rate": 4.715303240060835e-06, "loss": 1.0914, "step": 5935 }, { "epoch": 0.18, "learning_rate": 4.715190183942388e-06, "loss": 1.1653, "step": 5936 }, { "epoch": 0.18, "learning_rate": 4.7150771067363975e-06, "loss": 1.1833, "step": 5937 }, { "epoch": 0.18, "learning_rate": 4.714964008443941e-06, "loss": 1.152, "step": 5938 }, { "epoch": 0.18, "learning_rate": 4.714850889066092e-06, "loss": 1.0626, "step": 5939 }, { "epoch": 0.18, "learning_rate": 4.7147377486039295e-06, "loss": 1.158, "step": 5940 }, { "epoch": 0.18, "learning_rate": 4.714624587058531e-06, "loss": 1.1371, "step": 5941 }, { "epoch": 0.18, "learning_rate": 4.714511404430973e-06, "loss": 1.1638, "step": 5942 }, { "epoch": 0.18, "learning_rate": 4.714398200722332e-06, "loss": 1.2308, "step": 5943 }, { "epoch": 0.18, "learning_rate": 4.714284975933687e-06, "loss": 1.1569, "step": 5944 }, { "epoch": 0.18, "learning_rate": 4.714171730066116e-06, "loss": 1.1705, "step": 5945 }, { "epoch": 0.18, "learning_rate": 4.714058463120696e-06, "loss": 1.1975, "step": 5946 }, { "epoch": 0.18, "learning_rate": 4.7139451750985065e-06, "loss": 1.0565, "step": 5947 }, { "epoch": 0.18, "learning_rate": 4.713831866000625e-06, "loss": 1.249, "step": 5948 }, { "epoch": 0.18, "learning_rate": 4.71371853582813e-06, "loss": 1.1062, "step": 5949 }, { "epoch": 0.18, "learning_rate": 4.713605184582101e-06, "loss": 1.2361, "step": 5950 }, { "epoch": 0.18, "learning_rate": 4.713491812263616e-06, "loss": 1.1357, "step": 5951 }, { "epoch": 0.18, "learning_rate": 4.713378418873757e-06, "loss": 1.1362, "step": 5952 }, { "epoch": 0.18, "learning_rate": 4.713265004413599e-06, "loss": 1.1105, "step": 5953 }, { "epoch": 0.18, "learning_rate": 4.713151568884226e-06, "loss": 1.2318, "step": 5954 }, { "epoch": 0.18, "learning_rate": 4.7130381122867145e-06, "loss": 1.1411, "step": 5955 }, { "epoch": 0.18, "learning_rate": 4.712924634622147e-06, "loss": 1.0914, "step": 5956 }, { "epoch": 0.18, "learning_rate": 4.7128111358916016e-06, "loss": 1.2146, "step": 5957 }, { "epoch": 0.18, "learning_rate": 4.7126976160961616e-06, "loss": 1.2012, "step": 5958 }, { "epoch": 0.18, "learning_rate": 4.7125840752369045e-06, "loss": 1.2228, "step": 5959 }, { "epoch": 0.18, "learning_rate": 4.712470513314913e-06, "loss": 1.2043, "step": 5960 }, { "epoch": 0.18, "learning_rate": 4.712356930331268e-06, "loss": 1.1747, "step": 5961 }, { "epoch": 0.18, "learning_rate": 4.71224332628705e-06, "loss": 1.2228, "step": 5962 }, { "epoch": 0.18, "learning_rate": 4.712129701183341e-06, "loss": 1.2073, "step": 5963 }, { "epoch": 0.18, "learning_rate": 4.7120160550212235e-06, "loss": 1.2031, "step": 5964 }, { "epoch": 0.18, "learning_rate": 4.7119023878017785e-06, "loss": 1.1962, "step": 5965 }, { "epoch": 0.18, "learning_rate": 4.711788699526087e-06, "loss": 1.1194, "step": 5966 }, { "epoch": 0.18, "learning_rate": 4.711674990195234e-06, "loss": 1.1819, "step": 5967 }, { "epoch": 0.18, "learning_rate": 4.711561259810299e-06, "loss": 1.314, "step": 5968 }, { "epoch": 0.18, "learning_rate": 4.711447508372366e-06, "loss": 1.1962, "step": 5969 }, { "epoch": 0.18, "learning_rate": 4.711333735882518e-06, "loss": 1.1121, "step": 5970 }, { "epoch": 0.18, "learning_rate": 4.711219942341838e-06, "loss": 1.0791, "step": 5971 }, { "epoch": 0.18, "learning_rate": 4.711106127751408e-06, "loss": 1.0894, "step": 5972 }, { "epoch": 0.18, "learning_rate": 4.710992292112314e-06, "loss": 1.0952, "step": 5973 }, { "epoch": 0.18, "learning_rate": 4.710878435425637e-06, "loss": 1.0672, "step": 5974 }, { "epoch": 0.18, "learning_rate": 4.710764557692463e-06, "loss": 1.1289, "step": 5975 }, { "epoch": 0.18, "learning_rate": 4.710650658913876e-06, "loss": 1.1295, "step": 5976 }, { "epoch": 0.18, "learning_rate": 4.710536739090958e-06, "loss": 1.1186, "step": 5977 }, { "epoch": 0.18, "learning_rate": 4.7104227982247955e-06, "loss": 1.0634, "step": 5978 }, { "epoch": 0.18, "learning_rate": 4.710308836316472e-06, "loss": 1.1255, "step": 5979 }, { "epoch": 0.18, "learning_rate": 4.710194853367074e-06, "loss": 1.2563, "step": 5980 }, { "epoch": 0.18, "learning_rate": 4.710080849377684e-06, "loss": 1.3062, "step": 5981 }, { "epoch": 0.18, "learning_rate": 4.709966824349389e-06, "loss": 1.0984, "step": 5982 }, { "epoch": 0.18, "learning_rate": 4.709852778283275e-06, "loss": 1.2363, "step": 5983 }, { "epoch": 0.18, "learning_rate": 4.709738711180426e-06, "loss": 1.1016, "step": 5984 }, { "epoch": 0.18, "learning_rate": 4.70962462304193e-06, "loss": 1.1327, "step": 5985 }, { "epoch": 0.18, "learning_rate": 4.70951051386887e-06, "loss": 1.2665, "step": 5986 }, { "epoch": 0.18, "learning_rate": 4.709396383662334e-06, "loss": 1.2076, "step": 5987 }, { "epoch": 0.18, "learning_rate": 4.7092822324234105e-06, "loss": 1.202, "step": 5988 }, { "epoch": 0.18, "learning_rate": 4.709168060153183e-06, "loss": 1.0997, "step": 5989 }, { "epoch": 0.18, "learning_rate": 4.70905386685274e-06, "loss": 1.1981, "step": 5990 }, { "epoch": 0.18, "learning_rate": 4.7089396525231676e-06, "loss": 1.0938, "step": 5991 }, { "epoch": 0.18, "learning_rate": 4.708825417165553e-06, "loss": 1.0494, "step": 5992 }, { "epoch": 0.18, "learning_rate": 4.708711160780986e-06, "loss": 1.2291, "step": 5993 }, { "epoch": 0.18, "learning_rate": 4.708596883370551e-06, "loss": 1.107, "step": 5994 }, { "epoch": 0.18, "learning_rate": 4.708482584935338e-06, "loss": 1.2523, "step": 5995 }, { "epoch": 0.18, "learning_rate": 4.708368265476434e-06, "loss": 1.054, "step": 5996 }, { "epoch": 0.18, "learning_rate": 4.708253924994928e-06, "loss": 1.049, "step": 5997 }, { "epoch": 0.18, "learning_rate": 4.708139563491908e-06, "loss": 1.2289, "step": 5998 }, { "epoch": 0.18, "learning_rate": 4.7080251809684635e-06, "loss": 1.4247, "step": 5999 }, { "epoch": 0.18, "learning_rate": 4.707910777425681e-06, "loss": 1.1728, "step": 6000 }, { "epoch": 0.18, "learning_rate": 4.707796352864653e-06, "loss": 1.2828, "step": 6001 }, { "epoch": 0.18, "learning_rate": 4.707681907286467e-06, "loss": 1.1046, "step": 6002 }, { "epoch": 0.18, "learning_rate": 4.707567440692212e-06, "loss": 1.1583, "step": 6003 }, { "epoch": 0.18, "learning_rate": 4.707452953082978e-06, "loss": 1.2365, "step": 6004 }, { "epoch": 0.18, "learning_rate": 4.707338444459855e-06, "loss": 1.1747, "step": 6005 }, { "epoch": 0.18, "learning_rate": 4.707223914823933e-06, "loss": 1.196, "step": 6006 }, { "epoch": 0.18, "learning_rate": 4.707109364176303e-06, "loss": 1.1561, "step": 6007 }, { "epoch": 0.18, "learning_rate": 4.706994792518054e-06, "loss": 1.1918, "step": 6008 }, { "epoch": 0.18, "learning_rate": 4.706880199850279e-06, "loss": 1.1, "step": 6009 }, { "epoch": 0.18, "learning_rate": 4.706765586174066e-06, "loss": 1.1268, "step": 6010 }, { "epoch": 0.18, "learning_rate": 4.706650951490508e-06, "loss": 1.1573, "step": 6011 }, { "epoch": 0.18, "learning_rate": 4.706536295800696e-06, "loss": 1.2206, "step": 6012 }, { "epoch": 0.18, "learning_rate": 4.70642161910572e-06, "loss": 1.1268, "step": 6013 }, { "epoch": 0.18, "learning_rate": 4.706306921406673e-06, "loss": 1.1986, "step": 6014 }, { "epoch": 0.18, "learning_rate": 4.706192202704648e-06, "loss": 1.1995, "step": 6015 }, { "epoch": 0.18, "learning_rate": 4.706077463000734e-06, "loss": 1.1069, "step": 6016 }, { "epoch": 0.18, "learning_rate": 4.705962702296026e-06, "loss": 1.2539, "step": 6017 }, { "epoch": 0.18, "learning_rate": 4.705847920591616e-06, "loss": 1.1365, "step": 6018 }, { "epoch": 0.18, "learning_rate": 4.7057331178885954e-06, "loss": 1.1929, "step": 6019 }, { "epoch": 0.18, "learning_rate": 4.705618294188058e-06, "loss": 1.1846, "step": 6020 }, { "epoch": 0.18, "learning_rate": 4.705503449491096e-06, "loss": 0.9722, "step": 6021 }, { "epoch": 0.18, "learning_rate": 4.705388583798805e-06, "loss": 1.2217, "step": 6022 }, { "epoch": 0.18, "learning_rate": 4.705273697112276e-06, "loss": 1.0921, "step": 6023 }, { "epoch": 0.18, "learning_rate": 4.705158789432603e-06, "loss": 1.1411, "step": 6024 }, { "epoch": 0.18, "learning_rate": 4.705043860760881e-06, "loss": 1.2045, "step": 6025 }, { "epoch": 0.18, "learning_rate": 4.704928911098204e-06, "loss": 1.0812, "step": 6026 }, { "epoch": 0.18, "learning_rate": 4.704813940445665e-06, "loss": 1.1293, "step": 6027 }, { "epoch": 0.18, "learning_rate": 4.704698948804359e-06, "loss": 1.1111, "step": 6028 }, { "epoch": 0.18, "learning_rate": 4.704583936175381e-06, "loss": 1.2217, "step": 6029 }, { "epoch": 0.18, "learning_rate": 4.704468902559826e-06, "loss": 1.1447, "step": 6030 }, { "epoch": 0.18, "learning_rate": 4.704353847958788e-06, "loss": 1.1746, "step": 6031 }, { "epoch": 0.18, "learning_rate": 4.704238772373363e-06, "loss": 1.0733, "step": 6032 }, { "epoch": 0.18, "learning_rate": 4.704123675804647e-06, "loss": 1.1777, "step": 6033 }, { "epoch": 0.18, "learning_rate": 4.704008558253736e-06, "loss": 1.1771, "step": 6034 }, { "epoch": 0.18, "learning_rate": 4.703893419721724e-06, "loss": 1.1836, "step": 6035 }, { "epoch": 0.18, "learning_rate": 4.703778260209708e-06, "loss": 1.0981, "step": 6036 }, { "epoch": 0.18, "learning_rate": 4.7036630797187845e-06, "loss": 1.2242, "step": 6037 }, { "epoch": 0.18, "learning_rate": 4.703547878250049e-06, "loss": 1.1863, "step": 6038 }, { "epoch": 0.18, "learning_rate": 4.7034326558046e-06, "loss": 1.2349, "step": 6039 }, { "epoch": 0.18, "learning_rate": 4.7033174123835335e-06, "loss": 1.1115, "step": 6040 }, { "epoch": 0.18, "learning_rate": 4.703202147987945e-06, "loss": 1.1264, "step": 6041 }, { "epoch": 0.18, "learning_rate": 4.703086862618935e-06, "loss": 1.2047, "step": 6042 }, { "epoch": 0.18, "learning_rate": 4.7029715562775975e-06, "loss": 1.1823, "step": 6043 }, { "epoch": 0.18, "learning_rate": 4.7028562289650335e-06, "loss": 1.1783, "step": 6044 }, { "epoch": 0.18, "learning_rate": 4.7027408806823375e-06, "loss": 1.2213, "step": 6045 }, { "epoch": 0.18, "learning_rate": 4.70262551143061e-06, "loss": 1.1268, "step": 6046 }, { "epoch": 0.18, "learning_rate": 4.702510121210948e-06, "loss": 1.1603, "step": 6047 }, { "epoch": 0.18, "learning_rate": 4.702394710024451e-06, "loss": 1.1233, "step": 6048 }, { "epoch": 0.18, "learning_rate": 4.702279277872217e-06, "loss": 1.2095, "step": 6049 }, { "epoch": 0.18, "learning_rate": 4.702163824755345e-06, "loss": 0.9932, "step": 6050 }, { "epoch": 0.18, "learning_rate": 4.702048350674934e-06, "loss": 1.0639, "step": 6051 }, { "epoch": 0.18, "learning_rate": 4.701932855632082e-06, "loss": 1.1107, "step": 6052 }, { "epoch": 0.18, "learning_rate": 4.701817339627891e-06, "loss": 1.1934, "step": 6053 }, { "epoch": 0.18, "learning_rate": 4.701701802663459e-06, "loss": 1.2224, "step": 6054 }, { "epoch": 0.18, "learning_rate": 4.701586244739886e-06, "loss": 1.1568, "step": 6055 }, { "epoch": 0.18, "learning_rate": 4.701470665858273e-06, "loss": 1.1664, "step": 6056 }, { "epoch": 0.18, "learning_rate": 4.701355066019718e-06, "loss": 1.1407, "step": 6057 }, { "epoch": 0.18, "learning_rate": 4.701239445225324e-06, "loss": 1.1475, "step": 6058 }, { "epoch": 0.18, "learning_rate": 4.701123803476191e-06, "loss": 1.155, "step": 6059 }, { "epoch": 0.18, "learning_rate": 4.701008140773419e-06, "loss": 1.1644, "step": 6060 }, { "epoch": 0.18, "learning_rate": 4.70089245711811e-06, "loss": 1.1801, "step": 6061 }, { "epoch": 0.18, "learning_rate": 4.700776752511364e-06, "loss": 1.1155, "step": 6062 }, { "epoch": 0.18, "learning_rate": 4.700661026954284e-06, "loss": 1.1768, "step": 6063 }, { "epoch": 0.18, "learning_rate": 4.70054528044797e-06, "loss": 1.1472, "step": 6064 }, { "epoch": 0.18, "learning_rate": 4.700429512993526e-06, "loss": 1.1413, "step": 6065 }, { "epoch": 0.18, "learning_rate": 4.700313724592051e-06, "loss": 1.1224, "step": 6066 }, { "epoch": 0.18, "learning_rate": 4.700197915244651e-06, "loss": 1.2635, "step": 6067 }, { "epoch": 0.18, "learning_rate": 4.700082084952426e-06, "loss": 1.1256, "step": 6068 }, { "epoch": 0.18, "learning_rate": 4.699966233716479e-06, "loss": 1.2435, "step": 6069 }, { "epoch": 0.18, "learning_rate": 4.699850361537913e-06, "loss": 1.0928, "step": 6070 }, { "epoch": 0.18, "learning_rate": 4.6997344684178305e-06, "loss": 1.254, "step": 6071 }, { "epoch": 0.18, "learning_rate": 4.699618554357336e-06, "loss": 1.1265, "step": 6072 }, { "epoch": 0.18, "learning_rate": 4.699502619357532e-06, "loss": 1.1863, "step": 6073 }, { "epoch": 0.18, "learning_rate": 4.699386663419522e-06, "loss": 1.0863, "step": 6074 }, { "epoch": 0.18, "learning_rate": 4.699270686544411e-06, "loss": 1.2307, "step": 6075 }, { "epoch": 0.18, "learning_rate": 4.699154688733301e-06, "loss": 1.1932, "step": 6076 }, { "epoch": 0.18, "learning_rate": 4.699038669987298e-06, "loss": 1.0869, "step": 6077 }, { "epoch": 0.18, "learning_rate": 4.698922630307506e-06, "loss": 1.0054, "step": 6078 }, { "epoch": 0.18, "learning_rate": 4.698806569695031e-06, "loss": 1.0997, "step": 6079 }, { "epoch": 0.18, "learning_rate": 4.698690488150974e-06, "loss": 1.1984, "step": 6080 }, { "epoch": 0.18, "learning_rate": 4.698574385676445e-06, "loss": 1.291, "step": 6081 }, { "epoch": 0.18, "learning_rate": 4.698458262272545e-06, "loss": 1.0887, "step": 6082 }, { "epoch": 0.18, "learning_rate": 4.698342117940382e-06, "loss": 1.2169, "step": 6083 }, { "epoch": 0.18, "learning_rate": 4.69822595268106e-06, "loss": 1.1005, "step": 6084 }, { "epoch": 0.18, "learning_rate": 4.698109766495686e-06, "loss": 1.0764, "step": 6085 }, { "epoch": 0.18, "learning_rate": 4.697993559385365e-06, "loss": 1.1885, "step": 6086 }, { "epoch": 0.18, "learning_rate": 4.697877331351205e-06, "loss": 1.0737, "step": 6087 }, { "epoch": 0.18, "learning_rate": 4.697761082394311e-06, "loss": 1.2357, "step": 6088 }, { "epoch": 0.18, "learning_rate": 4.697644812515791e-06, "loss": 1.022, "step": 6089 }, { "epoch": 0.18, "learning_rate": 4.697528521716749e-06, "loss": 1.1382, "step": 6090 }, { "epoch": 0.18, "learning_rate": 4.697412209998294e-06, "loss": 1.1857, "step": 6091 }, { "epoch": 0.18, "learning_rate": 4.697295877361534e-06, "loss": 1.1494, "step": 6092 }, { "epoch": 0.18, "learning_rate": 4.697179523807575e-06, "loss": 1.0682, "step": 6093 }, { "epoch": 0.18, "learning_rate": 4.697063149337525e-06, "loss": 1.1638, "step": 6094 }, { "epoch": 0.18, "learning_rate": 4.696946753952492e-06, "loss": 1.1447, "step": 6095 }, { "epoch": 0.18, "learning_rate": 4.696830337653585e-06, "loss": 1.136, "step": 6096 }, { "epoch": 0.18, "learning_rate": 4.69671390044191e-06, "loss": 1.1783, "step": 6097 }, { "epoch": 0.18, "learning_rate": 4.6965974423185774e-06, "loss": 1.2366, "step": 6098 }, { "epoch": 0.18, "learning_rate": 4.696480963284695e-06, "loss": 1.2075, "step": 6099 }, { "epoch": 0.18, "learning_rate": 4.696364463341371e-06, "loss": 1.1708, "step": 6100 }, { "epoch": 0.18, "learning_rate": 4.696247942489716e-06, "loss": 1.1642, "step": 6101 }, { "epoch": 0.18, "learning_rate": 4.696131400730838e-06, "loss": 1.0643, "step": 6102 }, { "epoch": 0.18, "learning_rate": 4.696014838065847e-06, "loss": 1.1078, "step": 6103 }, { "epoch": 0.18, "learning_rate": 4.695898254495851e-06, "loss": 1.1877, "step": 6104 }, { "epoch": 0.18, "learning_rate": 4.695781650021963e-06, "loss": 1.1584, "step": 6105 }, { "epoch": 0.18, "learning_rate": 4.69566502464529e-06, "loss": 1.1155, "step": 6106 }, { "epoch": 0.18, "learning_rate": 4.695548378366944e-06, "loss": 1.1788, "step": 6107 }, { "epoch": 0.18, "learning_rate": 4.695431711188035e-06, "loss": 1.1043, "step": 6108 }, { "epoch": 0.18, "learning_rate": 4.6953150231096735e-06, "loss": 1.0053, "step": 6109 }, { "epoch": 0.18, "learning_rate": 4.69519831413297e-06, "loss": 1.1325, "step": 6110 }, { "epoch": 0.18, "learning_rate": 4.695081584259036e-06, "loss": 1.1252, "step": 6111 }, { "epoch": 0.18, "learning_rate": 4.694964833488982e-06, "loss": 1.2996, "step": 6112 }, { "epoch": 0.18, "learning_rate": 4.69484806182392e-06, "loss": 1.0649, "step": 6113 }, { "epoch": 0.18, "learning_rate": 4.694731269264961e-06, "loss": 1.1658, "step": 6114 }, { "epoch": 0.18, "learning_rate": 4.694614455813219e-06, "loss": 1.2858, "step": 6115 }, { "epoch": 0.18, "learning_rate": 4.694497621469803e-06, "loss": 1.1785, "step": 6116 }, { "epoch": 0.18, "learning_rate": 4.694380766235827e-06, "loss": 1.2003, "step": 6117 }, { "epoch": 0.18, "learning_rate": 4.694263890112402e-06, "loss": 1.1086, "step": 6118 }, { "epoch": 0.18, "learning_rate": 4.694146993100643e-06, "loss": 1.1475, "step": 6119 }, { "epoch": 0.18, "learning_rate": 4.694030075201661e-06, "loss": 1.1421, "step": 6120 }, { "epoch": 0.18, "learning_rate": 4.693913136416569e-06, "loss": 1.1693, "step": 6121 }, { "epoch": 0.18, "learning_rate": 4.693796176746481e-06, "loss": 1.1555, "step": 6122 }, { "epoch": 0.18, "learning_rate": 4.69367919619251e-06, "loss": 1.2262, "step": 6123 }, { "epoch": 0.18, "learning_rate": 4.6935621947557695e-06, "loss": 1.0751, "step": 6124 }, { "epoch": 0.18, "learning_rate": 4.693445172437373e-06, "loss": 1.2383, "step": 6125 }, { "epoch": 0.18, "learning_rate": 4.693328129238435e-06, "loss": 1.1082, "step": 6126 }, { "epoch": 0.18, "learning_rate": 4.693211065160069e-06, "loss": 1.1544, "step": 6127 }, { "epoch": 0.18, "learning_rate": 4.693093980203391e-06, "loss": 1.0047, "step": 6128 }, { "epoch": 0.18, "learning_rate": 4.6929768743695134e-06, "loss": 1.0098, "step": 6129 }, { "epoch": 0.18, "learning_rate": 4.692859747659553e-06, "loss": 1.1819, "step": 6130 }, { "epoch": 0.18, "learning_rate": 4.692742600074624e-06, "loss": 1.1636, "step": 6131 }, { "epoch": 0.18, "learning_rate": 4.6926254316158414e-06, "loss": 1.2405, "step": 6132 }, { "epoch": 0.18, "learning_rate": 4.692508242284321e-06, "loss": 1.126, "step": 6133 }, { "epoch": 0.18, "learning_rate": 4.692391032081177e-06, "loss": 1.1113, "step": 6134 }, { "epoch": 0.18, "learning_rate": 4.692273801007526e-06, "loss": 1.1782, "step": 6135 }, { "epoch": 0.18, "learning_rate": 4.692156549064486e-06, "loss": 1.1912, "step": 6136 }, { "epoch": 0.18, "learning_rate": 4.69203927625317e-06, "loss": 1.1695, "step": 6137 }, { "epoch": 0.18, "learning_rate": 4.691921982574697e-06, "loss": 1.232, "step": 6138 }, { "epoch": 0.18, "learning_rate": 4.691804668030182e-06, "loss": 1.1476, "step": 6139 }, { "epoch": 0.18, "learning_rate": 4.691687332620741e-06, "loss": 1.0894, "step": 6140 }, { "epoch": 0.18, "learning_rate": 4.691569976347493e-06, "loss": 1.2771, "step": 6141 }, { "epoch": 0.19, "learning_rate": 4.6914525992115545e-06, "loss": 1.2604, "step": 6142 }, { "epoch": 0.19, "learning_rate": 4.691335201214043e-06, "loss": 1.2037, "step": 6143 }, { "epoch": 0.19, "learning_rate": 4.691217782356075e-06, "loss": 1.1414, "step": 6144 }, { "epoch": 0.19, "learning_rate": 4.69110034263877e-06, "loss": 1.0715, "step": 6145 }, { "epoch": 0.19, "learning_rate": 4.690982882063244e-06, "loss": 1.2649, "step": 6146 }, { "epoch": 0.19, "learning_rate": 4.690865400630616e-06, "loss": 1.1815, "step": 6147 }, { "epoch": 0.19, "learning_rate": 4.690747898342005e-06, "loss": 1.2058, "step": 6148 }, { "epoch": 0.19, "learning_rate": 4.69063037519853e-06, "loss": 1.2069, "step": 6149 }, { "epoch": 0.19, "learning_rate": 4.690512831201308e-06, "loss": 1.1721, "step": 6150 }, { "epoch": 0.19, "learning_rate": 4.690395266351458e-06, "loss": 1.1747, "step": 6151 }, { "epoch": 0.19, "learning_rate": 4.690277680650101e-06, "loss": 1.192, "step": 6152 }, { "epoch": 0.19, "learning_rate": 4.690160074098356e-06, "loss": 1.1038, "step": 6153 }, { "epoch": 0.19, "learning_rate": 4.690042446697342e-06, "loss": 1.1885, "step": 6154 }, { "epoch": 0.19, "learning_rate": 4.689924798448177e-06, "loss": 1.1699, "step": 6155 }, { "epoch": 0.19, "learning_rate": 4.689807129351984e-06, "loss": 1.1321, "step": 6156 }, { "epoch": 0.19, "learning_rate": 4.689689439409881e-06, "loss": 1.0947, "step": 6157 }, { "epoch": 0.19, "learning_rate": 4.689571728622989e-06, "loss": 1.0423, "step": 6158 }, { "epoch": 0.19, "learning_rate": 4.689453996992429e-06, "loss": 0.9735, "step": 6159 }, { "epoch": 0.19, "learning_rate": 4.689336244519322e-06, "loss": 1.0319, "step": 6160 }, { "epoch": 0.19, "learning_rate": 4.689218471204787e-06, "loss": 1.2474, "step": 6161 }, { "epoch": 0.19, "learning_rate": 4.689100677049948e-06, "loss": 1.1189, "step": 6162 }, { "epoch": 0.19, "learning_rate": 4.688982862055924e-06, "loss": 1.1134, "step": 6163 }, { "epoch": 0.19, "learning_rate": 4.688865026223838e-06, "loss": 1.0871, "step": 6164 }, { "epoch": 0.19, "learning_rate": 4.68874716955481e-06, "loss": 1.1793, "step": 6165 }, { "epoch": 0.19, "learning_rate": 4.688629292049964e-06, "loss": 1.1665, "step": 6166 }, { "epoch": 0.19, "learning_rate": 4.688511393710421e-06, "loss": 1.1242, "step": 6167 }, { "epoch": 0.19, "learning_rate": 4.688393474537304e-06, "loss": 1.1467, "step": 6168 }, { "epoch": 0.19, "learning_rate": 4.688275534531735e-06, "loss": 1.066, "step": 6169 }, { "epoch": 0.19, "learning_rate": 4.688157573694837e-06, "loss": 1.1446, "step": 6170 }, { "epoch": 0.19, "learning_rate": 4.688039592027731e-06, "loss": 1.197, "step": 6171 }, { "epoch": 0.19, "learning_rate": 4.6879215895315436e-06, "loss": 1.2003, "step": 6172 }, { "epoch": 0.19, "learning_rate": 4.687803566207396e-06, "loss": 1.2406, "step": 6173 }, { "epoch": 0.19, "learning_rate": 4.687685522056412e-06, "loss": 1.1993, "step": 6174 }, { "epoch": 0.19, "learning_rate": 4.687567457079716e-06, "loss": 1.1898, "step": 6175 }, { "epoch": 0.19, "learning_rate": 4.687449371278431e-06, "loss": 1.1987, "step": 6176 }, { "epoch": 0.19, "learning_rate": 4.6873312646536815e-06, "loss": 1.1035, "step": 6177 }, { "epoch": 0.19, "learning_rate": 4.687213137206592e-06, "loss": 1.1984, "step": 6178 }, { "epoch": 0.19, "learning_rate": 4.687094988938286e-06, "loss": 1.1273, "step": 6179 }, { "epoch": 0.19, "learning_rate": 4.68697681984989e-06, "loss": 1.1282, "step": 6180 }, { "epoch": 0.19, "learning_rate": 4.686858629942527e-06, "loss": 1.1938, "step": 6181 }, { "epoch": 0.19, "learning_rate": 4.686740419217324e-06, "loss": 1.1481, "step": 6182 }, { "epoch": 0.19, "learning_rate": 4.686622187675405e-06, "loss": 1.1643, "step": 6183 }, { "epoch": 0.19, "learning_rate": 4.686503935317896e-06, "loss": 1.1766, "step": 6184 }, { "epoch": 0.19, "learning_rate": 4.686385662145922e-06, "loss": 1.1493, "step": 6185 }, { "epoch": 0.19, "learning_rate": 4.686267368160611e-06, "loss": 1.1347, "step": 6186 }, { "epoch": 0.19, "learning_rate": 4.686149053363086e-06, "loss": 1.1126, "step": 6187 }, { "epoch": 0.19, "learning_rate": 4.686030717754476e-06, "loss": 1.0924, "step": 6188 }, { "epoch": 0.19, "learning_rate": 4.685912361335906e-06, "loss": 1.1661, "step": 6189 }, { "epoch": 0.19, "learning_rate": 4.685793984108503e-06, "loss": 1.0546, "step": 6190 }, { "epoch": 0.19, "learning_rate": 4.685675586073394e-06, "loss": 1.1114, "step": 6191 }, { "epoch": 0.19, "learning_rate": 4.685557167231706e-06, "loss": 1.1512, "step": 6192 }, { "epoch": 0.19, "learning_rate": 4.685438727584566e-06, "loss": 1.1241, "step": 6193 }, { "epoch": 0.19, "learning_rate": 4.6853202671331025e-06, "loss": 1.2205, "step": 6194 }, { "epoch": 0.19, "learning_rate": 4.685201785878442e-06, "loss": 1.1959, "step": 6195 }, { "epoch": 0.19, "learning_rate": 4.685083283821713e-06, "loss": 1.0831, "step": 6196 }, { "epoch": 0.19, "learning_rate": 4.684964760964044e-06, "loss": 1.0858, "step": 6197 }, { "epoch": 0.19, "learning_rate": 4.684846217306563e-06, "loss": 1.0947, "step": 6198 }, { "epoch": 0.19, "learning_rate": 4.6847276528503975e-06, "loss": 1.1157, "step": 6199 }, { "epoch": 0.19, "learning_rate": 4.684609067596677e-06, "loss": 1.1168, "step": 6200 }, { "epoch": 0.19, "learning_rate": 4.684490461546532e-06, "loss": 1.1225, "step": 6201 }, { "epoch": 0.19, "learning_rate": 4.684371834701087e-06, "loss": 1.1141, "step": 6202 }, { "epoch": 0.19, "learning_rate": 4.684253187061476e-06, "loss": 1.2032, "step": 6203 }, { "epoch": 0.19, "learning_rate": 4.684134518628827e-06, "loss": 1.1334, "step": 6204 }, { "epoch": 0.19, "learning_rate": 4.684015829404268e-06, "loss": 1.2772, "step": 6205 }, { "epoch": 0.19, "learning_rate": 4.683897119388931e-06, "loss": 1.1996, "step": 6206 }, { "epoch": 0.19, "learning_rate": 4.683778388583945e-06, "loss": 1.2452, "step": 6207 }, { "epoch": 0.19, "learning_rate": 4.68365963699044e-06, "loss": 1.1804, "step": 6208 }, { "epoch": 0.19, "learning_rate": 4.683540864609548e-06, "loss": 1.2017, "step": 6209 }, { "epoch": 0.19, "learning_rate": 4.683422071442397e-06, "loss": 1.1575, "step": 6210 }, { "epoch": 0.19, "learning_rate": 4.683303257490121e-06, "loss": 1.174, "step": 6211 }, { "epoch": 0.19, "learning_rate": 4.683184422753849e-06, "loss": 1.2759, "step": 6212 }, { "epoch": 0.19, "learning_rate": 4.683065567234712e-06, "loss": 1.1222, "step": 6213 }, { "epoch": 0.19, "learning_rate": 4.682946690933844e-06, "loss": 1.1201, "step": 6214 }, { "epoch": 0.19, "learning_rate": 4.682827793852373e-06, "loss": 1.2097, "step": 6215 }, { "epoch": 0.19, "learning_rate": 4.6827088759914345e-06, "loss": 1.1957, "step": 6216 }, { "epoch": 0.19, "learning_rate": 4.682589937352157e-06, "loss": 1.2517, "step": 6217 }, { "epoch": 0.19, "learning_rate": 4.682470977935675e-06, "loss": 1.2003, "step": 6218 }, { "epoch": 0.19, "learning_rate": 4.682351997743121e-06, "loss": 1.2034, "step": 6219 }, { "epoch": 0.19, "learning_rate": 4.682232996775626e-06, "loss": 1.0353, "step": 6220 }, { "epoch": 0.19, "learning_rate": 4.682113975034324e-06, "loss": 1.1487, "step": 6221 }, { "epoch": 0.19, "learning_rate": 4.681994932520349e-06, "loss": 1.1345, "step": 6222 }, { "epoch": 0.19, "learning_rate": 4.681875869234833e-06, "loss": 1.1998, "step": 6223 }, { "epoch": 0.19, "learning_rate": 4.681756785178909e-06, "loss": 1.3082, "step": 6224 }, { "epoch": 0.19, "learning_rate": 4.681637680353711e-06, "loss": 1.0995, "step": 6225 }, { "epoch": 0.19, "learning_rate": 4.681518554760372e-06, "loss": 1.0731, "step": 6226 }, { "epoch": 0.19, "learning_rate": 4.681399408400029e-06, "loss": 1.1368, "step": 6227 }, { "epoch": 0.19, "learning_rate": 4.681280241273814e-06, "loss": 1.1413, "step": 6228 }, { "epoch": 0.19, "learning_rate": 4.681161053382861e-06, "loss": 1.1925, "step": 6229 }, { "epoch": 0.19, "learning_rate": 4.681041844728305e-06, "loss": 1.1924, "step": 6230 }, { "epoch": 0.19, "learning_rate": 4.680922615311281e-06, "loss": 1.3188, "step": 6231 }, { "epoch": 0.19, "learning_rate": 4.680803365132925e-06, "loss": 1.0345, "step": 6232 }, { "epoch": 0.19, "learning_rate": 4.680684094194371e-06, "loss": 1.0759, "step": 6233 }, { "epoch": 0.19, "learning_rate": 4.680564802496754e-06, "loss": 1.0794, "step": 6234 }, { "epoch": 0.19, "learning_rate": 4.680445490041211e-06, "loss": 1.1174, "step": 6235 }, { "epoch": 0.19, "learning_rate": 4.680326156828876e-06, "loss": 1.1259, "step": 6236 }, { "epoch": 0.19, "learning_rate": 4.6802068028608874e-06, "loss": 1.2006, "step": 6237 }, { "epoch": 0.19, "learning_rate": 4.68008742813838e-06, "loss": 1.0464, "step": 6238 }, { "epoch": 0.19, "learning_rate": 4.679968032662489e-06, "loss": 1.1044, "step": 6239 }, { "epoch": 0.19, "learning_rate": 4.679848616434353e-06, "loss": 1.193, "step": 6240 }, { "epoch": 0.19, "learning_rate": 4.679729179455108e-06, "loss": 1.1121, "step": 6241 }, { "epoch": 0.19, "learning_rate": 4.679609721725891e-06, "loss": 1.2039, "step": 6242 }, { "epoch": 0.19, "learning_rate": 4.679490243247839e-06, "loss": 1.1028, "step": 6243 }, { "epoch": 0.19, "learning_rate": 4.67937074402209e-06, "loss": 1.0853, "step": 6244 }, { "epoch": 0.19, "learning_rate": 4.679251224049781e-06, "loss": 1.1216, "step": 6245 }, { "epoch": 0.19, "learning_rate": 4.67913168333205e-06, "loss": 1.1195, "step": 6246 }, { "epoch": 0.19, "learning_rate": 4.679012121870035e-06, "loss": 1.0891, "step": 6247 }, { "epoch": 0.19, "learning_rate": 4.678892539664873e-06, "loss": 1.0762, "step": 6248 }, { "epoch": 0.19, "learning_rate": 4.678772936717705e-06, "loss": 1.2192, "step": 6249 }, { "epoch": 0.19, "learning_rate": 4.678653313029667e-06, "loss": 1.1683, "step": 6250 }, { "epoch": 0.19, "learning_rate": 4.678533668601899e-06, "loss": 1.1249, "step": 6251 }, { "epoch": 0.19, "learning_rate": 4.678414003435539e-06, "loss": 1.1621, "step": 6252 }, { "epoch": 0.19, "learning_rate": 4.678294317531728e-06, "loss": 1.2095, "step": 6253 }, { "epoch": 0.19, "learning_rate": 4.678174610891603e-06, "loss": 1.0165, "step": 6254 }, { "epoch": 0.19, "learning_rate": 4.678054883516306e-06, "loss": 1.1461, "step": 6255 }, { "epoch": 0.19, "learning_rate": 4.6779351354069746e-06, "loss": 1.0939, "step": 6256 }, { "epoch": 0.19, "learning_rate": 4.6778153665647494e-06, "loss": 1.0897, "step": 6257 }, { "epoch": 0.19, "learning_rate": 4.677695576990772e-06, "loss": 1.1312, "step": 6258 }, { "epoch": 0.19, "learning_rate": 4.67757576668618e-06, "loss": 1.0255, "step": 6259 }, { "epoch": 0.19, "learning_rate": 4.677455935652117e-06, "loss": 1.0821, "step": 6260 }, { "epoch": 0.19, "learning_rate": 4.677336083889721e-06, "loss": 1.1464, "step": 6261 }, { "epoch": 0.19, "learning_rate": 4.677216211400135e-06, "loss": 1.2416, "step": 6262 }, { "epoch": 0.19, "learning_rate": 4.677096318184498e-06, "loss": 1.1683, "step": 6263 }, { "epoch": 0.19, "learning_rate": 4.676976404243954e-06, "loss": 1.2074, "step": 6264 }, { "epoch": 0.19, "learning_rate": 4.676856469579643e-06, "loss": 1.0652, "step": 6265 }, { "epoch": 0.19, "learning_rate": 4.676736514192706e-06, "loss": 1.1134, "step": 6266 }, { "epoch": 0.19, "learning_rate": 4.676616538084286e-06, "loss": 1.1063, "step": 6267 }, { "epoch": 0.19, "learning_rate": 4.6764965412555245e-06, "loss": 1.1873, "step": 6268 }, { "epoch": 0.19, "learning_rate": 4.676376523707565e-06, "loss": 1.1339, "step": 6269 }, { "epoch": 0.19, "learning_rate": 4.676256485441548e-06, "loss": 1.1952, "step": 6270 }, { "epoch": 0.19, "learning_rate": 4.676136426458618e-06, "loss": 1.1686, "step": 6271 }, { "epoch": 0.19, "learning_rate": 4.676016346759918e-06, "loss": 1.2288, "step": 6272 }, { "epoch": 0.19, "learning_rate": 4.6758962463465895e-06, "loss": 1.2402, "step": 6273 }, { "epoch": 0.19, "learning_rate": 4.675776125219778e-06, "loss": 1.1708, "step": 6274 }, { "epoch": 0.19, "learning_rate": 4.675655983380624e-06, "loss": 1.1986, "step": 6275 }, { "epoch": 0.19, "learning_rate": 4.675535820830274e-06, "loss": 1.1311, "step": 6276 }, { "epoch": 0.19, "learning_rate": 4.67541563756987e-06, "loss": 1.1041, "step": 6277 }, { "epoch": 0.19, "learning_rate": 4.675295433600557e-06, "loss": 1.0995, "step": 6278 }, { "epoch": 0.19, "learning_rate": 4.675175208923479e-06, "loss": 1.1075, "step": 6279 }, { "epoch": 0.19, "learning_rate": 4.675054963539782e-06, "loss": 1.1735, "step": 6280 }, { "epoch": 0.19, "learning_rate": 4.674934697450607e-06, "loss": 1.157, "step": 6281 }, { "epoch": 0.19, "learning_rate": 4.674814410657103e-06, "loss": 1.1932, "step": 6282 }, { "epoch": 0.19, "learning_rate": 4.674694103160412e-06, "loss": 1.041, "step": 6283 }, { "epoch": 0.19, "learning_rate": 4.674573774961681e-06, "loss": 1.1832, "step": 6284 }, { "epoch": 0.19, "learning_rate": 4.674453426062055e-06, "loss": 1.1148, "step": 6285 }, { "epoch": 0.19, "learning_rate": 4.67433305646268e-06, "loss": 1.1854, "step": 6286 }, { "epoch": 0.19, "learning_rate": 4.674212666164701e-06, "loss": 1.165, "step": 6287 }, { "epoch": 0.19, "learning_rate": 4.6740922551692645e-06, "loss": 1.111, "step": 6288 }, { "epoch": 0.19, "learning_rate": 4.673971823477517e-06, "loss": 1.1728, "step": 6289 }, { "epoch": 0.19, "learning_rate": 4.6738513710906056e-06, "loss": 1.1368, "step": 6290 }, { "epoch": 0.19, "learning_rate": 4.6737308980096755e-06, "loss": 1.1997, "step": 6291 }, { "epoch": 0.19, "learning_rate": 4.673610404235873e-06, "loss": 1.2446, "step": 6292 }, { "epoch": 0.19, "learning_rate": 4.673489889770347e-06, "loss": 1.0296, "step": 6293 }, { "epoch": 0.19, "learning_rate": 4.673369354614244e-06, "loss": 1.0687, "step": 6294 }, { "epoch": 0.19, "learning_rate": 4.673248798768713e-06, "loss": 1.133, "step": 6295 }, { "epoch": 0.19, "learning_rate": 4.673128222234899e-06, "loss": 1.1075, "step": 6296 }, { "epoch": 0.19, "learning_rate": 4.67300762501395e-06, "loss": 1.1751, "step": 6297 }, { "epoch": 0.19, "learning_rate": 4.672887007107016e-06, "loss": 1.3054, "step": 6298 }, { "epoch": 0.19, "learning_rate": 4.672766368515244e-06, "loss": 1.3577, "step": 6299 }, { "epoch": 0.19, "learning_rate": 4.672645709239783e-06, "loss": 1.2408, "step": 6300 }, { "epoch": 0.19, "learning_rate": 4.6725250292817805e-06, "loss": 1.1215, "step": 6301 }, { "epoch": 0.19, "learning_rate": 4.672404328642386e-06, "loss": 1.1655, "step": 6302 }, { "epoch": 0.19, "learning_rate": 4.67228360732275e-06, "loss": 1.1832, "step": 6303 }, { "epoch": 0.19, "learning_rate": 4.672162865324018e-06, "loss": 1.163, "step": 6304 }, { "epoch": 0.19, "learning_rate": 4.672042102647343e-06, "loss": 1.1478, "step": 6305 }, { "epoch": 0.19, "learning_rate": 4.671921319293873e-06, "loss": 1.1296, "step": 6306 }, { "epoch": 0.19, "learning_rate": 4.671800515264758e-06, "loss": 1.229, "step": 6307 }, { "epoch": 0.19, "learning_rate": 4.671679690561149e-06, "loss": 1.1771, "step": 6308 }, { "epoch": 0.19, "learning_rate": 4.671558845184194e-06, "loss": 1.1591, "step": 6309 }, { "epoch": 0.19, "learning_rate": 4.6714379791350455e-06, "loss": 1.1564, "step": 6310 }, { "epoch": 0.19, "learning_rate": 4.671317092414853e-06, "loss": 1.2029, "step": 6311 }, { "epoch": 0.19, "learning_rate": 4.6711961850247675e-06, "loss": 1.0497, "step": 6312 }, { "epoch": 0.19, "learning_rate": 4.67107525696594e-06, "loss": 1.108, "step": 6313 }, { "epoch": 0.19, "learning_rate": 4.670954308239521e-06, "loss": 1.1147, "step": 6314 }, { "epoch": 0.19, "learning_rate": 4.670833338846664e-06, "loss": 1.1793, "step": 6315 }, { "epoch": 0.19, "learning_rate": 4.6707123487885186e-06, "loss": 1.0615, "step": 6316 }, { "epoch": 0.19, "learning_rate": 4.670591338066237e-06, "loss": 1.3019, "step": 6317 }, { "epoch": 0.19, "learning_rate": 4.6704703066809705e-06, "loss": 1.1761, "step": 6318 }, { "epoch": 0.19, "learning_rate": 4.670349254633872e-06, "loss": 1.1495, "step": 6319 }, { "epoch": 0.19, "learning_rate": 4.670228181926094e-06, "loss": 1.121, "step": 6320 }, { "epoch": 0.19, "learning_rate": 4.67010708855879e-06, "loss": 1.2013, "step": 6321 }, { "epoch": 0.19, "learning_rate": 4.669985974533111e-06, "loss": 1.0524, "step": 6322 }, { "epoch": 0.19, "learning_rate": 4.669864839850211e-06, "loss": 1.1231, "step": 6323 }, { "epoch": 0.19, "learning_rate": 4.669743684511243e-06, "loss": 1.098, "step": 6324 }, { "epoch": 0.19, "learning_rate": 4.6696225085173585e-06, "loss": 1.1555, "step": 6325 }, { "epoch": 0.19, "learning_rate": 4.669501311869714e-06, "loss": 1.1455, "step": 6326 }, { "epoch": 0.19, "learning_rate": 4.669380094569462e-06, "loss": 1.1067, "step": 6327 }, { "epoch": 0.19, "learning_rate": 4.669258856617756e-06, "loss": 1.0129, "step": 6328 }, { "epoch": 0.19, "learning_rate": 4.66913759801575e-06, "loss": 1.1857, "step": 6329 }, { "epoch": 0.19, "learning_rate": 4.6690163187645995e-06, "loss": 1.2083, "step": 6330 }, { "epoch": 0.19, "learning_rate": 4.668895018865457e-06, "loss": 1.2468, "step": 6331 }, { "epoch": 0.19, "learning_rate": 4.66877369831948e-06, "loss": 1.1464, "step": 6332 }, { "epoch": 0.19, "learning_rate": 4.668652357127821e-06, "loss": 1.1322, "step": 6333 }, { "epoch": 0.19, "learning_rate": 4.668530995291636e-06, "loss": 1.116, "step": 6334 }, { "epoch": 0.19, "learning_rate": 4.668409612812081e-06, "loss": 1.2815, "step": 6335 }, { "epoch": 0.19, "learning_rate": 4.66828820969031e-06, "loss": 1.1312, "step": 6336 }, { "epoch": 0.19, "learning_rate": 4.6681667859274805e-06, "loss": 1.2634, "step": 6337 }, { "epoch": 0.19, "learning_rate": 4.668045341524747e-06, "loss": 1.2189, "step": 6338 }, { "epoch": 0.19, "learning_rate": 4.667923876483266e-06, "loss": 1.2358, "step": 6339 }, { "epoch": 0.19, "learning_rate": 4.667802390804193e-06, "loss": 1.1954, "step": 6340 }, { "epoch": 0.19, "learning_rate": 4.667680884488686e-06, "loss": 1.1887, "step": 6341 }, { "epoch": 0.19, "learning_rate": 4.667559357537901e-06, "loss": 1.1665, "step": 6342 }, { "epoch": 0.19, "learning_rate": 4.667437809952995e-06, "loss": 1.1925, "step": 6343 }, { "epoch": 0.19, "learning_rate": 4.667316241735125e-06, "loss": 1.2452, "step": 6344 }, { "epoch": 0.19, "learning_rate": 4.667194652885447e-06, "loss": 1.0715, "step": 6345 }, { "epoch": 0.19, "learning_rate": 4.667073043405122e-06, "loss": 1.1987, "step": 6346 }, { "epoch": 0.19, "learning_rate": 4.666951413295303e-06, "loss": 1.1071, "step": 6347 }, { "epoch": 0.19, "learning_rate": 4.666829762557151e-06, "loss": 1.1168, "step": 6348 }, { "epoch": 0.19, "learning_rate": 4.666708091191824e-06, "loss": 1.1008, "step": 6349 }, { "epoch": 0.19, "learning_rate": 4.666586399200478e-06, "loss": 1.1757, "step": 6350 }, { "epoch": 0.19, "learning_rate": 4.666464686584274e-06, "loss": 1.0391, "step": 6351 }, { "epoch": 0.19, "learning_rate": 4.66634295334437e-06, "loss": 1.0966, "step": 6352 }, { "epoch": 0.19, "learning_rate": 4.6662211994819235e-06, "loss": 1.1302, "step": 6353 }, { "epoch": 0.19, "learning_rate": 4.666099424998094e-06, "loss": 1.1306, "step": 6354 }, { "epoch": 0.19, "learning_rate": 4.665977629894043e-06, "loss": 1.0934, "step": 6355 }, { "epoch": 0.19, "learning_rate": 4.665855814170927e-06, "loss": 1.1838, "step": 6356 }, { "epoch": 0.19, "learning_rate": 4.665733977829907e-06, "loss": 1.1639, "step": 6357 }, { "epoch": 0.19, "learning_rate": 4.665612120872142e-06, "loss": 1.144, "step": 6358 }, { "epoch": 0.19, "learning_rate": 4.665490243298793e-06, "loss": 1.1686, "step": 6359 }, { "epoch": 0.19, "learning_rate": 4.66536834511102e-06, "loss": 1.0964, "step": 6360 }, { "epoch": 0.19, "learning_rate": 4.665246426309983e-06, "loss": 1.1398, "step": 6361 }, { "epoch": 0.19, "learning_rate": 4.665124486896842e-06, "loss": 1.1609, "step": 6362 }, { "epoch": 0.19, "learning_rate": 4.66500252687276e-06, "loss": 1.183, "step": 6363 }, { "epoch": 0.19, "learning_rate": 4.664880546238897e-06, "loss": 1.256, "step": 6364 }, { "epoch": 0.19, "learning_rate": 4.6647585449964125e-06, "loss": 1.2186, "step": 6365 }, { "epoch": 0.19, "learning_rate": 4.6646365231464704e-06, "loss": 1.1567, "step": 6366 }, { "epoch": 0.19, "learning_rate": 4.66451448069023e-06, "loss": 1.1709, "step": 6367 }, { "epoch": 0.19, "learning_rate": 4.6643924176288556e-06, "loss": 1.2751, "step": 6368 }, { "epoch": 0.19, "learning_rate": 4.664270333963506e-06, "loss": 1.1044, "step": 6369 }, { "epoch": 0.19, "learning_rate": 4.664148229695347e-06, "loss": 1.1501, "step": 6370 }, { "epoch": 0.19, "learning_rate": 4.664026104825537e-06, "loss": 1.1169, "step": 6371 }, { "epoch": 0.19, "learning_rate": 4.663903959355242e-06, "loss": 1.0407, "step": 6372 }, { "epoch": 0.19, "learning_rate": 4.663781793285624e-06, "loss": 1.0406, "step": 6373 }, { "epoch": 0.19, "learning_rate": 4.6636596066178455e-06, "loss": 1.3184, "step": 6374 }, { "epoch": 0.19, "learning_rate": 4.663537399353069e-06, "loss": 1.2096, "step": 6375 }, { "epoch": 0.19, "learning_rate": 4.663415171492458e-06, "loss": 1.0483, "step": 6376 }, { "epoch": 0.19, "learning_rate": 4.663292923037177e-06, "loss": 1.187, "step": 6377 }, { "epoch": 0.19, "learning_rate": 4.663170653988389e-06, "loss": 1.1412, "step": 6378 }, { "epoch": 0.19, "learning_rate": 4.663048364347259e-06, "loss": 1.1689, "step": 6379 }, { "epoch": 0.19, "learning_rate": 4.662926054114949e-06, "loss": 1.1491, "step": 6380 }, { "epoch": 0.19, "learning_rate": 4.662803723292625e-06, "loss": 1.3429, "step": 6381 }, { "epoch": 0.19, "learning_rate": 4.662681371881453e-06, "loss": 1.2332, "step": 6382 }, { "epoch": 0.19, "learning_rate": 4.662558999882594e-06, "loss": 1.1196, "step": 6383 }, { "epoch": 0.19, "learning_rate": 4.662436607297215e-06, "loss": 1.1493, "step": 6384 }, { "epoch": 0.19, "learning_rate": 4.662314194126481e-06, "loss": 1.1243, "step": 6385 }, { "epoch": 0.19, "learning_rate": 4.6621917603715576e-06, "loss": 1.0696, "step": 6386 }, { "epoch": 0.19, "learning_rate": 4.6620693060336095e-06, "loss": 1.1041, "step": 6387 }, { "epoch": 0.19, "learning_rate": 4.6619468311138035e-06, "loss": 1.2606, "step": 6388 }, { "epoch": 0.19, "learning_rate": 4.661824335613305e-06, "loss": 1.171, "step": 6389 }, { "epoch": 0.19, "learning_rate": 4.66170181953328e-06, "loss": 1.1198, "step": 6390 }, { "epoch": 0.19, "learning_rate": 4.661579282874895e-06, "loss": 1.1244, "step": 6391 }, { "epoch": 0.19, "learning_rate": 4.661456725639316e-06, "loss": 1.0927, "step": 6392 }, { "epoch": 0.19, "learning_rate": 4.66133414782771e-06, "loss": 1.2139, "step": 6393 }, { "epoch": 0.19, "learning_rate": 4.661211549441243e-06, "loss": 1.1141, "step": 6394 }, { "epoch": 0.19, "learning_rate": 4.661088930481084e-06, "loss": 1.1528, "step": 6395 }, { "epoch": 0.19, "learning_rate": 4.6609662909483985e-06, "loss": 1.1959, "step": 6396 }, { "epoch": 0.19, "learning_rate": 4.660843630844355e-06, "loss": 1.236, "step": 6397 }, { "epoch": 0.19, "learning_rate": 4.66072095017012e-06, "loss": 1.1173, "step": 6398 }, { "epoch": 0.19, "learning_rate": 4.660598248926863e-06, "loss": 1.2988, "step": 6399 }, { "epoch": 0.19, "learning_rate": 4.660475527115752e-06, "loss": 1.1335, "step": 6400 }, { "epoch": 0.19, "learning_rate": 4.660352784737953e-06, "loss": 1.0759, "step": 6401 }, { "epoch": 0.19, "learning_rate": 4.6602300217946374e-06, "loss": 1.0911, "step": 6402 }, { "epoch": 0.19, "learning_rate": 4.660107238286971e-06, "loss": 1.129, "step": 6403 }, { "epoch": 0.19, "learning_rate": 4.659984434216125e-06, "loss": 1.087, "step": 6404 }, { "epoch": 0.19, "learning_rate": 4.659861609583267e-06, "loss": 1.2203, "step": 6405 }, { "epoch": 0.19, "learning_rate": 4.659738764389567e-06, "loss": 1.199, "step": 6406 }, { "epoch": 0.19, "learning_rate": 4.659615898636194e-06, "loss": 1.1078, "step": 6407 }, { "epoch": 0.19, "learning_rate": 4.6594930123243176e-06, "loss": 1.1613, "step": 6408 }, { "epoch": 0.19, "learning_rate": 4.6593701054551075e-06, "loss": 1.0734, "step": 6409 }, { "epoch": 0.19, "learning_rate": 4.659247178029735e-06, "loss": 1.1064, "step": 6410 }, { "epoch": 0.19, "learning_rate": 4.6591242300493685e-06, "loss": 1.1447, "step": 6411 }, { "epoch": 0.19, "learning_rate": 4.659001261515179e-06, "loss": 1.2029, "step": 6412 }, { "epoch": 0.19, "learning_rate": 4.658878272428337e-06, "loss": 1.2205, "step": 6413 }, { "epoch": 0.19, "learning_rate": 4.658755262790016e-06, "loss": 1.1693, "step": 6414 }, { "epoch": 0.19, "learning_rate": 4.658632232601382e-06, "loss": 1.2242, "step": 6415 }, { "epoch": 0.19, "learning_rate": 4.65850918186361e-06, "loss": 1.0232, "step": 6416 }, { "epoch": 0.19, "learning_rate": 4.6583861105778696e-06, "loss": 1.1895, "step": 6417 }, { "epoch": 0.19, "learning_rate": 4.658263018745333e-06, "loss": 1.1328, "step": 6418 }, { "epoch": 0.19, "learning_rate": 4.658139906367172e-06, "loss": 1.2146, "step": 6419 }, { "epoch": 0.19, "learning_rate": 4.658016773444559e-06, "loss": 1.1527, "step": 6420 }, { "epoch": 0.19, "learning_rate": 4.657893619978665e-06, "loss": 1.036, "step": 6421 }, { "epoch": 0.19, "learning_rate": 4.657770445970663e-06, "loss": 1.1577, "step": 6422 }, { "epoch": 0.19, "learning_rate": 4.657647251421726e-06, "loss": 1.1597, "step": 6423 }, { "epoch": 0.19, "learning_rate": 4.6575240363330265e-06, "loss": 1.1523, "step": 6424 }, { "epoch": 0.19, "learning_rate": 4.657400800705737e-06, "loss": 1.1481, "step": 6425 }, { "epoch": 0.19, "learning_rate": 4.657277544541031e-06, "loss": 1.2001, "step": 6426 }, { "epoch": 0.19, "learning_rate": 4.657154267840081e-06, "loss": 1.0788, "step": 6427 }, { "epoch": 0.19, "learning_rate": 4.6570309706040615e-06, "loss": 1.098, "step": 6428 }, { "epoch": 0.19, "learning_rate": 4.656907652834147e-06, "loss": 1.179, "step": 6429 }, { "epoch": 0.19, "learning_rate": 4.6567843145315095e-06, "loss": 1.1599, "step": 6430 }, { "epoch": 0.19, "learning_rate": 4.656660955697325e-06, "loss": 1.1887, "step": 6431 }, { "epoch": 0.19, "learning_rate": 4.6565375763327655e-06, "loss": 1.1917, "step": 6432 }, { "epoch": 0.19, "learning_rate": 4.6564141764390085e-06, "loss": 1.1337, "step": 6433 }, { "epoch": 0.19, "learning_rate": 4.656290756017226e-06, "loss": 1.2053, "step": 6434 }, { "epoch": 0.19, "learning_rate": 4.656167315068594e-06, "loss": 1.1355, "step": 6435 }, { "epoch": 0.19, "learning_rate": 4.656043853594288e-06, "loss": 1.108, "step": 6436 }, { "epoch": 0.19, "learning_rate": 4.655920371595483e-06, "loss": 1.2715, "step": 6437 }, { "epoch": 0.19, "learning_rate": 4.655796869073354e-06, "loss": 1.1313, "step": 6438 }, { "epoch": 0.19, "learning_rate": 4.655673346029077e-06, "loss": 1.0955, "step": 6439 }, { "epoch": 0.19, "learning_rate": 4.655549802463828e-06, "loss": 1.118, "step": 6440 }, { "epoch": 0.19, "learning_rate": 4.655426238378784e-06, "loss": 1.2083, "step": 6441 }, { "epoch": 0.19, "learning_rate": 4.655302653775119e-06, "loss": 1.1293, "step": 6442 }, { "epoch": 0.19, "learning_rate": 4.655179048654011e-06, "loss": 1.2015, "step": 6443 }, { "epoch": 0.19, "learning_rate": 4.655055423016638e-06, "loss": 1.1449, "step": 6444 }, { "epoch": 0.19, "learning_rate": 4.654931776864174e-06, "loss": 1.2233, "step": 6445 }, { "epoch": 0.19, "learning_rate": 4.654808110197797e-06, "loss": 1.1429, "step": 6446 }, { "epoch": 0.19, "learning_rate": 4.654684423018685e-06, "loss": 1.1337, "step": 6447 }, { "epoch": 0.19, "learning_rate": 4.6545607153280146e-06, "loss": 1.218, "step": 6448 }, { "epoch": 0.19, "learning_rate": 4.654436987126965e-06, "loss": 1.1779, "step": 6449 }, { "epoch": 0.19, "learning_rate": 4.654313238416712e-06, "loss": 1.0595, "step": 6450 }, { "epoch": 0.19, "learning_rate": 4.6541894691984345e-06, "loss": 1.0853, "step": 6451 }, { "epoch": 0.19, "learning_rate": 4.654065679473311e-06, "loss": 1.1646, "step": 6452 }, { "epoch": 0.19, "learning_rate": 4.653941869242519e-06, "loss": 1.1299, "step": 6453 }, { "epoch": 0.19, "learning_rate": 4.653818038507239e-06, "loss": 0.9478, "step": 6454 }, { "epoch": 0.19, "learning_rate": 4.653694187268648e-06, "loss": 1.2415, "step": 6455 }, { "epoch": 0.19, "learning_rate": 4.653570315527925e-06, "loss": 1.2132, "step": 6456 }, { "epoch": 0.19, "learning_rate": 4.65344642328625e-06, "loss": 1.1462, "step": 6457 }, { "epoch": 0.19, "learning_rate": 4.653322510544803e-06, "loss": 1.1907, "step": 6458 }, { "epoch": 0.19, "learning_rate": 4.6531985773047625e-06, "loss": 1.009, "step": 6459 }, { "epoch": 0.19, "learning_rate": 4.653074623567308e-06, "loss": 1.2145, "step": 6460 }, { "epoch": 0.19, "learning_rate": 4.652950649333621e-06, "loss": 1.2587, "step": 6461 }, { "epoch": 0.19, "learning_rate": 4.65282665460488e-06, "loss": 1.1519, "step": 6462 }, { "epoch": 0.19, "learning_rate": 4.652702639382265e-06, "loss": 1.0361, "step": 6463 }, { "epoch": 0.19, "learning_rate": 4.652578603666959e-06, "loss": 1.0625, "step": 6464 }, { "epoch": 0.19, "learning_rate": 4.652454547460142e-06, "loss": 1.0466, "step": 6465 }, { "epoch": 0.19, "learning_rate": 4.652330470762994e-06, "loss": 1.0929, "step": 6466 }, { "epoch": 0.19, "learning_rate": 4.652206373576695e-06, "loss": 1.1005, "step": 6467 }, { "epoch": 0.19, "learning_rate": 4.652082255902429e-06, "loss": 1.2032, "step": 6468 }, { "epoch": 0.19, "learning_rate": 4.651958117741377e-06, "loss": 1.0323, "step": 6469 }, { "epoch": 0.19, "learning_rate": 4.65183395909472e-06, "loss": 1.1655, "step": 6470 }, { "epoch": 0.19, "learning_rate": 4.651709779963639e-06, "loss": 1.1345, "step": 6471 }, { "epoch": 0.19, "learning_rate": 4.6515855803493175e-06, "loss": 1.2031, "step": 6472 }, { "epoch": 0.19, "learning_rate": 4.651461360252938e-06, "loss": 1.2526, "step": 6473 }, { "epoch": 0.2, "learning_rate": 4.651337119675683e-06, "loss": 1.1569, "step": 6474 }, { "epoch": 0.2, "learning_rate": 4.651212858618733e-06, "loss": 1.1479, "step": 6475 }, { "epoch": 0.2, "learning_rate": 4.651088577083273e-06, "loss": 1.1428, "step": 6476 }, { "epoch": 0.2, "learning_rate": 4.650964275070488e-06, "loss": 1.1967, "step": 6477 }, { "epoch": 0.2, "learning_rate": 4.650839952581556e-06, "loss": 1.0869, "step": 6478 }, { "epoch": 0.2, "learning_rate": 4.650715609617666e-06, "loss": 1.2408, "step": 6479 }, { "epoch": 0.2, "learning_rate": 4.6505912461799985e-06, "loss": 1.0402, "step": 6480 }, { "epoch": 0.2, "learning_rate": 4.650466862269738e-06, "loss": 1.2397, "step": 6481 }, { "epoch": 0.2, "learning_rate": 4.650342457888068e-06, "loss": 1.1207, "step": 6482 }, { "epoch": 0.2, "learning_rate": 4.650218033036174e-06, "loss": 1.0825, "step": 6483 }, { "epoch": 0.2, "learning_rate": 4.65009358771524e-06, "loss": 1.136, "step": 6484 }, { "epoch": 0.2, "learning_rate": 4.64996912192645e-06, "loss": 1.0883, "step": 6485 }, { "epoch": 0.2, "learning_rate": 4.64984463567099e-06, "loss": 1.0546, "step": 6486 }, { "epoch": 0.2, "learning_rate": 4.649720128950045e-06, "loss": 1.3011, "step": 6487 }, { "epoch": 0.2, "learning_rate": 4.649595601764799e-06, "loss": 1.1349, "step": 6488 }, { "epoch": 0.2, "learning_rate": 4.649471054116438e-06, "loss": 1.1378, "step": 6489 }, { "epoch": 0.2, "learning_rate": 4.649346486006148e-06, "loss": 1.1547, "step": 6490 }, { "epoch": 0.2, "learning_rate": 4.6492218974351145e-06, "loss": 1.1117, "step": 6491 }, { "epoch": 0.2, "learning_rate": 4.649097288404523e-06, "loss": 1.1149, "step": 6492 }, { "epoch": 0.2, "learning_rate": 4.648972658915562e-06, "loss": 1.1061, "step": 6493 }, { "epoch": 0.2, "learning_rate": 4.648848008969415e-06, "loss": 1.2819, "step": 6494 }, { "epoch": 0.2, "learning_rate": 4.6487233385672705e-06, "loss": 1.1508, "step": 6495 }, { "epoch": 0.2, "learning_rate": 4.648598647710314e-06, "loss": 1.1783, "step": 6496 }, { "epoch": 0.2, "learning_rate": 4.6484739363997334e-06, "loss": 1.0952, "step": 6497 }, { "epoch": 0.2, "learning_rate": 4.648349204636717e-06, "loss": 1.1713, "step": 6498 }, { "epoch": 0.2, "learning_rate": 4.648224452422448e-06, "loss": 1.1146, "step": 6499 }, { "epoch": 0.2, "learning_rate": 4.648099679758119e-06, "loss": 1.1114, "step": 6500 }, { "epoch": 0.2, "learning_rate": 4.647974886644916e-06, "loss": 1.1121, "step": 6501 }, { "epoch": 0.2, "learning_rate": 4.6478500730840244e-06, "loss": 1.1425, "step": 6502 }, { "epoch": 0.2, "learning_rate": 4.647725239076636e-06, "loss": 1.0457, "step": 6503 }, { "epoch": 0.2, "learning_rate": 4.647600384623938e-06, "loss": 1.1294, "step": 6504 }, { "epoch": 0.2, "learning_rate": 4.6474755097271185e-06, "loss": 1.1575, "step": 6505 }, { "epoch": 0.2, "learning_rate": 4.6473506143873655e-06, "loss": 1.109, "step": 6506 }, { "epoch": 0.2, "learning_rate": 4.647225698605869e-06, "loss": 1.1056, "step": 6507 }, { "epoch": 0.2, "learning_rate": 4.647100762383819e-06, "loss": 1.122, "step": 6508 }, { "epoch": 0.2, "learning_rate": 4.646975805722404e-06, "loss": 1.1921, "step": 6509 }, { "epoch": 0.2, "learning_rate": 4.646850828622812e-06, "loss": 1.1771, "step": 6510 }, { "epoch": 0.2, "learning_rate": 4.646725831086235e-06, "loss": 1.1516, "step": 6511 }, { "epoch": 0.2, "learning_rate": 4.6466008131138616e-06, "loss": 1.2342, "step": 6512 }, { "epoch": 0.2, "learning_rate": 4.646475774706882e-06, "loss": 1.1928, "step": 6513 }, { "epoch": 0.2, "learning_rate": 4.646350715866488e-06, "loss": 1.1842, "step": 6514 }, { "epoch": 0.2, "learning_rate": 4.646225636593867e-06, "loss": 1.2189, "step": 6515 }, { "epoch": 0.2, "learning_rate": 4.6461005368902135e-06, "loss": 1.0963, "step": 6516 }, { "epoch": 0.2, "learning_rate": 4.645975416756715e-06, "loss": 1.2164, "step": 6517 }, { "epoch": 0.2, "learning_rate": 4.6458502761945655e-06, "loss": 1.1509, "step": 6518 }, { "epoch": 0.2, "learning_rate": 4.645725115204954e-06, "loss": 1.222, "step": 6519 }, { "epoch": 0.2, "learning_rate": 4.645599933789072e-06, "loss": 1.1953, "step": 6520 }, { "epoch": 0.2, "learning_rate": 4.645474731948113e-06, "loss": 1.0972, "step": 6521 }, { "epoch": 0.2, "learning_rate": 4.645349509683268e-06, "loss": 1.1224, "step": 6522 }, { "epoch": 0.2, "learning_rate": 4.645224266995729e-06, "loss": 1.1941, "step": 6523 }, { "epoch": 0.2, "learning_rate": 4.645099003886688e-06, "loss": 1.2103, "step": 6524 }, { "epoch": 0.2, "learning_rate": 4.644973720357338e-06, "loss": 1.208, "step": 6525 }, { "epoch": 0.2, "learning_rate": 4.64484841640887e-06, "loss": 1.1377, "step": 6526 }, { "epoch": 0.2, "learning_rate": 4.644723092042479e-06, "loss": 1.1297, "step": 6527 }, { "epoch": 0.2, "learning_rate": 4.644597747259356e-06, "loss": 1.0501, "step": 6528 }, { "epoch": 0.2, "learning_rate": 4.644472382060696e-06, "loss": 1.1139, "step": 6529 }, { "epoch": 0.2, "learning_rate": 4.644346996447692e-06, "loss": 1.1168, "step": 6530 }, { "epoch": 0.2, "learning_rate": 4.644221590421537e-06, "loss": 1.1234, "step": 6531 }, { "epoch": 0.2, "learning_rate": 4.644096163983426e-06, "loss": 1.147, "step": 6532 }, { "epoch": 0.2, "learning_rate": 4.6439707171345515e-06, "loss": 1.1333, "step": 6533 }, { "epoch": 0.2, "learning_rate": 4.643845249876109e-06, "loss": 1.0096, "step": 6534 }, { "epoch": 0.2, "learning_rate": 4.643719762209291e-06, "loss": 1.1662, "step": 6535 }, { "epoch": 0.2, "learning_rate": 4.6435942541352945e-06, "loss": 1.1241, "step": 6536 }, { "epoch": 0.2, "learning_rate": 4.643468725655312e-06, "loss": 1.2147, "step": 6537 }, { "epoch": 0.2, "learning_rate": 4.643343176770539e-06, "loss": 1.1275, "step": 6538 }, { "epoch": 0.2, "learning_rate": 4.643217607482173e-06, "loss": 1.2446, "step": 6539 }, { "epoch": 0.2, "learning_rate": 4.643092017791407e-06, "loss": 1.0646, "step": 6540 }, { "epoch": 0.2, "learning_rate": 4.6429664076994375e-06, "loss": 1.1403, "step": 6541 }, { "epoch": 0.2, "learning_rate": 4.642840777207459e-06, "loss": 1.1469, "step": 6542 }, { "epoch": 0.2, "learning_rate": 4.642715126316669e-06, "loss": 1.1619, "step": 6543 }, { "epoch": 0.2, "learning_rate": 4.642589455028263e-06, "loss": 1.1624, "step": 6544 }, { "epoch": 0.2, "learning_rate": 4.642463763343436e-06, "loss": 1.132, "step": 6545 }, { "epoch": 0.2, "learning_rate": 4.642338051263387e-06, "loss": 1.0916, "step": 6546 }, { "epoch": 0.2, "learning_rate": 4.642212318789311e-06, "loss": 1.1855, "step": 6547 }, { "epoch": 0.2, "learning_rate": 4.6420865659224065e-06, "loss": 1.1411, "step": 6548 }, { "epoch": 0.2, "learning_rate": 4.641960792663869e-06, "loss": 1.0718, "step": 6549 }, { "epoch": 0.2, "learning_rate": 4.641834999014896e-06, "loss": 1.0993, "step": 6550 }, { "epoch": 0.2, "learning_rate": 4.641709184976685e-06, "loss": 1.2005, "step": 6551 }, { "epoch": 0.2, "learning_rate": 4.641583350550435e-06, "loss": 1.1191, "step": 6552 }, { "epoch": 0.2, "learning_rate": 4.641457495737342e-06, "loss": 1.0878, "step": 6553 }, { "epoch": 0.2, "learning_rate": 4.641331620538606e-06, "loss": 1.0281, "step": 6554 }, { "epoch": 0.2, "learning_rate": 4.641205724955424e-06, "loss": 1.1522, "step": 6555 }, { "epoch": 0.2, "learning_rate": 4.641079808988994e-06, "loss": 1.2603, "step": 6556 }, { "epoch": 0.2, "learning_rate": 4.640953872640516e-06, "loss": 1.1884, "step": 6557 }, { "epoch": 0.2, "learning_rate": 4.640827915911188e-06, "loss": 1.0817, "step": 6558 }, { "epoch": 0.2, "learning_rate": 4.64070193880221e-06, "loss": 1.2012, "step": 6559 }, { "epoch": 0.2, "learning_rate": 4.64057594131478e-06, "loss": 1.1287, "step": 6560 }, { "epoch": 0.2, "learning_rate": 4.640449923450098e-06, "loss": 1.1721, "step": 6561 }, { "epoch": 0.2, "learning_rate": 4.640323885209363e-06, "loss": 1.0233, "step": 6562 }, { "epoch": 0.2, "learning_rate": 4.6401978265937765e-06, "loss": 1.149, "step": 6563 }, { "epoch": 0.2, "learning_rate": 4.640071747604537e-06, "loss": 1.1736, "step": 6564 }, { "epoch": 0.2, "learning_rate": 4.639945648242845e-06, "loss": 1.1611, "step": 6565 }, { "epoch": 0.2, "learning_rate": 4.639819528509901e-06, "loss": 1.1732, "step": 6566 }, { "epoch": 0.2, "learning_rate": 4.639693388406906e-06, "loss": 1.1744, "step": 6567 }, { "epoch": 0.2, "learning_rate": 4.63956722793506e-06, "loss": 1.0314, "step": 6568 }, { "epoch": 0.2, "learning_rate": 4.639441047095565e-06, "loss": 1.0974, "step": 6569 }, { "epoch": 0.2, "learning_rate": 4.639314845889622e-06, "loss": 1.0571, "step": 6570 }, { "epoch": 0.2, "learning_rate": 4.639188624318431e-06, "loss": 1.1373, "step": 6571 }, { "epoch": 0.2, "learning_rate": 4.639062382383195e-06, "loss": 1.3024, "step": 6572 }, { "epoch": 0.2, "learning_rate": 4.638936120085115e-06, "loss": 1.205, "step": 6573 }, { "epoch": 0.2, "learning_rate": 4.638809837425394e-06, "loss": 1.188, "step": 6574 }, { "epoch": 0.2, "learning_rate": 4.638683534405233e-06, "loss": 1.2054, "step": 6575 }, { "epoch": 0.2, "learning_rate": 4.638557211025835e-06, "loss": 1.1296, "step": 6576 }, { "epoch": 0.2, "learning_rate": 4.638430867288402e-06, "loss": 1.1488, "step": 6577 }, { "epoch": 0.2, "learning_rate": 4.638304503194137e-06, "loss": 1.1835, "step": 6578 }, { "epoch": 0.2, "learning_rate": 4.6381781187442425e-06, "loss": 1.2279, "step": 6579 }, { "epoch": 0.2, "learning_rate": 4.638051713939923e-06, "loss": 1.1982, "step": 6580 }, { "epoch": 0.2, "learning_rate": 4.637925288782381e-06, "loss": 1.0681, "step": 6581 }, { "epoch": 0.2, "learning_rate": 4.637798843272819e-06, "loss": 1.1772, "step": 6582 }, { "epoch": 0.2, "learning_rate": 4.637672377412442e-06, "loss": 1.0604, "step": 6583 }, { "epoch": 0.2, "learning_rate": 4.637545891202454e-06, "loss": 1.1252, "step": 6584 }, { "epoch": 0.2, "learning_rate": 4.637419384644058e-06, "loss": 1.2355, "step": 6585 }, { "epoch": 0.2, "learning_rate": 4.637292857738459e-06, "loss": 1.1322, "step": 6586 }, { "epoch": 0.2, "learning_rate": 4.637166310486861e-06, "loss": 1.3287, "step": 6587 }, { "epoch": 0.2, "learning_rate": 4.63703974289047e-06, "loss": 1.1775, "step": 6588 }, { "epoch": 0.2, "learning_rate": 4.636913154950489e-06, "loss": 1.1455, "step": 6589 }, { "epoch": 0.2, "learning_rate": 4.636786546668125e-06, "loss": 1.1683, "step": 6590 }, { "epoch": 0.2, "learning_rate": 4.636659918044581e-06, "loss": 1.0551, "step": 6591 }, { "epoch": 0.2, "learning_rate": 4.6365332690810635e-06, "loss": 1.1669, "step": 6592 }, { "epoch": 0.2, "learning_rate": 4.636406599778779e-06, "loss": 1.1301, "step": 6593 }, { "epoch": 0.2, "learning_rate": 4.636279910138933e-06, "loss": 1.1796, "step": 6594 }, { "epoch": 0.2, "learning_rate": 4.6361532001627305e-06, "loss": 1.2083, "step": 6595 }, { "epoch": 0.2, "learning_rate": 4.636026469851379e-06, "loss": 1.1459, "step": 6596 }, { "epoch": 0.2, "learning_rate": 4.6358997192060826e-06, "loss": 1.07, "step": 6597 }, { "epoch": 0.2, "learning_rate": 4.635772948228051e-06, "loss": 1.1901, "step": 6598 }, { "epoch": 0.2, "learning_rate": 4.63564615691849e-06, "loss": 1.0654, "step": 6599 }, { "epoch": 0.2, "learning_rate": 4.6355193452786045e-06, "loss": 1.1463, "step": 6600 }, { "epoch": 0.2, "learning_rate": 4.635392513309605e-06, "loss": 1.0695, "step": 6601 }, { "epoch": 0.2, "learning_rate": 4.6352656610126955e-06, "loss": 1.2184, "step": 6602 }, { "epoch": 0.2, "learning_rate": 4.635138788389087e-06, "loss": 1.2266, "step": 6603 }, { "epoch": 0.2, "learning_rate": 4.635011895439984e-06, "loss": 1.1367, "step": 6604 }, { "epoch": 0.2, "learning_rate": 4.634884982166596e-06, "loss": 1.2079, "step": 6605 }, { "epoch": 0.2, "learning_rate": 4.634758048570132e-06, "loss": 1.21, "step": 6606 }, { "epoch": 0.2, "learning_rate": 4.6346310946518e-06, "loss": 1.2242, "step": 6607 }, { "epoch": 0.2, "learning_rate": 4.634504120412807e-06, "loss": 1.1139, "step": 6608 }, { "epoch": 0.2, "learning_rate": 4.634377125854363e-06, "loss": 1.2144, "step": 6609 }, { "epoch": 0.2, "learning_rate": 4.634250110977678e-06, "loss": 1.2016, "step": 6610 }, { "epoch": 0.2, "learning_rate": 4.634123075783958e-06, "loss": 1.3132, "step": 6611 }, { "epoch": 0.2, "learning_rate": 4.633996020274415e-06, "loss": 1.2676, "step": 6612 }, { "epoch": 0.2, "learning_rate": 4.633868944450258e-06, "loss": 1.1647, "step": 6613 }, { "epoch": 0.2, "learning_rate": 4.633741848312696e-06, "loss": 1.0416, "step": 6614 }, { "epoch": 0.2, "learning_rate": 4.6336147318629395e-06, "loss": 1.1407, "step": 6615 }, { "epoch": 0.2, "learning_rate": 4.633487595102198e-06, "loss": 1.1558, "step": 6616 }, { "epoch": 0.2, "learning_rate": 4.633360438031682e-06, "loss": 1.1115, "step": 6617 }, { "epoch": 0.2, "learning_rate": 4.633233260652602e-06, "loss": 1.1548, "step": 6618 }, { "epoch": 0.2, "learning_rate": 4.63310606296617e-06, "loss": 1.1301, "step": 6619 }, { "epoch": 0.2, "learning_rate": 4.6329788449735935e-06, "loss": 1.0604, "step": 6620 }, { "epoch": 0.2, "learning_rate": 4.6328516066760874e-06, "loss": 1.1842, "step": 6621 }, { "epoch": 0.2, "learning_rate": 4.632724348074861e-06, "loss": 1.2369, "step": 6622 }, { "epoch": 0.2, "learning_rate": 4.632597069171125e-06, "loss": 1.251, "step": 6623 }, { "epoch": 0.2, "learning_rate": 4.632469769966093e-06, "loss": 1.2104, "step": 6624 }, { "epoch": 0.2, "learning_rate": 4.632342450460975e-06, "loss": 1.0437, "step": 6625 }, { "epoch": 0.2, "learning_rate": 4.6322151106569844e-06, "loss": 1.1103, "step": 6626 }, { "epoch": 0.2, "learning_rate": 4.6320877505553325e-06, "loss": 1.1885, "step": 6627 }, { "epoch": 0.2, "learning_rate": 4.631960370157232e-06, "loss": 1.1204, "step": 6628 }, { "epoch": 0.2, "learning_rate": 4.631832969463896e-06, "loss": 1.1393, "step": 6629 }, { "epoch": 0.2, "learning_rate": 4.631705548476537e-06, "loss": 1.1769, "step": 6630 }, { "epoch": 0.2, "learning_rate": 4.631578107196367e-06, "loss": 1.2633, "step": 6631 }, { "epoch": 0.2, "learning_rate": 4.631450645624601e-06, "loss": 1.2109, "step": 6632 }, { "epoch": 0.2, "learning_rate": 4.631323163762451e-06, "loss": 1.1412, "step": 6633 }, { "epoch": 0.2, "learning_rate": 4.631195661611131e-06, "loss": 1.1655, "step": 6634 }, { "epoch": 0.2, "learning_rate": 4.631068139171855e-06, "loss": 1.1516, "step": 6635 }, { "epoch": 0.2, "learning_rate": 4.630940596445835e-06, "loss": 1.1187, "step": 6636 }, { "epoch": 0.2, "learning_rate": 4.630813033434289e-06, "loss": 1.1961, "step": 6637 }, { "epoch": 0.2, "learning_rate": 4.630685450138428e-06, "loss": 1.0699, "step": 6638 }, { "epoch": 0.2, "learning_rate": 4.630557846559468e-06, "loss": 1.1594, "step": 6639 }, { "epoch": 0.2, "learning_rate": 4.630430222698623e-06, "loss": 0.9834, "step": 6640 }, { "epoch": 0.2, "learning_rate": 4.630302578557109e-06, "loss": 1.0652, "step": 6641 }, { "epoch": 0.2, "learning_rate": 4.63017491413614e-06, "loss": 1.1716, "step": 6642 }, { "epoch": 0.2, "learning_rate": 4.6300472294369325e-06, "loss": 1.269, "step": 6643 }, { "epoch": 0.2, "learning_rate": 4.6299195244607e-06, "loss": 1.2179, "step": 6644 }, { "epoch": 0.2, "learning_rate": 4.62979179920866e-06, "loss": 1.1152, "step": 6645 }, { "epoch": 0.2, "learning_rate": 4.629664053682028e-06, "loss": 1.0372, "step": 6646 }, { "epoch": 0.2, "learning_rate": 4.62953628788202e-06, "loss": 1.1129, "step": 6647 }, { "epoch": 0.2, "learning_rate": 4.629408501809852e-06, "loss": 1.1233, "step": 6648 }, { "epoch": 0.2, "learning_rate": 4.62928069546674e-06, "loss": 1.2961, "step": 6649 }, { "epoch": 0.2, "learning_rate": 4.629152868853903e-06, "loss": 1.2009, "step": 6650 }, { "epoch": 0.2, "learning_rate": 4.629025021972554e-06, "loss": 1.3302, "step": 6651 }, { "epoch": 0.2, "learning_rate": 4.6288971548239135e-06, "loss": 1.2111, "step": 6652 }, { "epoch": 0.2, "learning_rate": 4.628769267409197e-06, "loss": 1.2129, "step": 6653 }, { "epoch": 0.2, "learning_rate": 4.628641359729622e-06, "loss": 1.1762, "step": 6654 }, { "epoch": 0.2, "learning_rate": 4.6285134317864065e-06, "loss": 1.1668, "step": 6655 }, { "epoch": 0.2, "learning_rate": 4.628385483580769e-06, "loss": 1.1376, "step": 6656 }, { "epoch": 0.2, "learning_rate": 4.628257515113926e-06, "loss": 1.1445, "step": 6657 }, { "epoch": 0.2, "learning_rate": 4.628129526387097e-06, "loss": 1.1908, "step": 6658 }, { "epoch": 0.2, "learning_rate": 4.6280015174015e-06, "loss": 1.2559, "step": 6659 }, { "epoch": 0.2, "learning_rate": 4.627873488158353e-06, "loss": 1.117, "step": 6660 }, { "epoch": 0.2, "learning_rate": 4.627745438658875e-06, "loss": 1.0901, "step": 6661 }, { "epoch": 0.2, "learning_rate": 4.6276173689042855e-06, "loss": 1.3143, "step": 6662 }, { "epoch": 0.2, "learning_rate": 4.627489278895804e-06, "loss": 1.1906, "step": 6663 }, { "epoch": 0.2, "learning_rate": 4.627361168634648e-06, "loss": 1.1654, "step": 6664 }, { "epoch": 0.2, "learning_rate": 4.627233038122039e-06, "loss": 1.1711, "step": 6665 }, { "epoch": 0.2, "learning_rate": 4.627104887359195e-06, "loss": 1.069, "step": 6666 }, { "epoch": 0.2, "learning_rate": 4.6269767163473375e-06, "loss": 1.1069, "step": 6667 }, { "epoch": 0.2, "learning_rate": 4.626848525087687e-06, "loss": 1.0264, "step": 6668 }, { "epoch": 0.2, "learning_rate": 4.626720313581462e-06, "loss": 1.0717, "step": 6669 }, { "epoch": 0.2, "learning_rate": 4.626592081829883e-06, "loss": 1.1658, "step": 6670 }, { "epoch": 0.2, "learning_rate": 4.626463829834174e-06, "loss": 1.1357, "step": 6671 }, { "epoch": 0.2, "learning_rate": 4.626335557595552e-06, "loss": 1.141, "step": 6672 }, { "epoch": 0.2, "learning_rate": 4.626207265115239e-06, "loss": 1.1829, "step": 6673 }, { "epoch": 0.2, "learning_rate": 4.626078952394457e-06, "loss": 1.1937, "step": 6674 }, { "epoch": 0.2, "learning_rate": 4.625950619434428e-06, "loss": 1.1081, "step": 6675 }, { "epoch": 0.2, "learning_rate": 4.625822266236373e-06, "loss": 1.2022, "step": 6676 }, { "epoch": 0.2, "learning_rate": 4.625693892801513e-06, "loss": 1.1769, "step": 6677 }, { "epoch": 0.2, "learning_rate": 4.625565499131071e-06, "loss": 1.1104, "step": 6678 }, { "epoch": 0.2, "learning_rate": 4.62543708522627e-06, "loss": 1.1611, "step": 6679 }, { "epoch": 0.2, "learning_rate": 4.625308651088332e-06, "loss": 1.2627, "step": 6680 }, { "epoch": 0.2, "learning_rate": 4.625180196718479e-06, "loss": 1.2377, "step": 6681 }, { "epoch": 0.2, "learning_rate": 4.625051722117932e-06, "loss": 1.1228, "step": 6682 }, { "epoch": 0.2, "learning_rate": 4.624923227287918e-06, "loss": 1.0963, "step": 6683 }, { "epoch": 0.2, "learning_rate": 4.624794712229657e-06, "loss": 1.0663, "step": 6684 }, { "epoch": 0.2, "learning_rate": 4.624666176944376e-06, "loss": 1.0696, "step": 6685 }, { "epoch": 0.2, "learning_rate": 4.624537621433295e-06, "loss": 1.1214, "step": 6686 }, { "epoch": 0.2, "learning_rate": 4.624409045697639e-06, "loss": 1.0966, "step": 6687 }, { "epoch": 0.2, "learning_rate": 4.624280449738631e-06, "loss": 1.1366, "step": 6688 }, { "epoch": 0.2, "learning_rate": 4.624151833557497e-06, "loss": 1.0776, "step": 6689 }, { "epoch": 0.2, "learning_rate": 4.624023197155461e-06, "loss": 1.1625, "step": 6690 }, { "epoch": 0.2, "learning_rate": 4.623894540533747e-06, "loss": 1.1073, "step": 6691 }, { "epoch": 0.2, "learning_rate": 4.623765863693579e-06, "loss": 1.1711, "step": 6692 }, { "epoch": 0.2, "learning_rate": 4.623637166636184e-06, "loss": 1.1414, "step": 6693 }, { "epoch": 0.2, "learning_rate": 4.623508449362785e-06, "loss": 1.0314, "step": 6694 }, { "epoch": 0.2, "learning_rate": 4.623379711874609e-06, "loss": 1.1408, "step": 6695 }, { "epoch": 0.2, "learning_rate": 4.623250954172881e-06, "loss": 1.1073, "step": 6696 }, { "epoch": 0.2, "learning_rate": 4.623122176258826e-06, "loss": 1.1188, "step": 6697 }, { "epoch": 0.2, "learning_rate": 4.62299337813367e-06, "loss": 1.3013, "step": 6698 }, { "epoch": 0.2, "learning_rate": 4.62286455979864e-06, "loss": 1.2894, "step": 6699 }, { "epoch": 0.2, "learning_rate": 4.622735721254962e-06, "loss": 1.1348, "step": 6700 }, { "epoch": 0.2, "learning_rate": 4.622606862503862e-06, "loss": 1.1472, "step": 6701 }, { "epoch": 0.2, "learning_rate": 4.622477983546567e-06, "loss": 1.1879, "step": 6702 }, { "epoch": 0.2, "learning_rate": 4.622349084384304e-06, "loss": 1.1716, "step": 6703 }, { "epoch": 0.2, "learning_rate": 4.6222201650183e-06, "loss": 1.112, "step": 6704 }, { "epoch": 0.2, "learning_rate": 4.622091225449781e-06, "loss": 1.1744, "step": 6705 }, { "epoch": 0.2, "learning_rate": 4.621962265679977e-06, "loss": 1.203, "step": 6706 }, { "epoch": 0.2, "learning_rate": 4.621833285710113e-06, "loss": 1.1868, "step": 6707 }, { "epoch": 0.2, "learning_rate": 4.621704285541419e-06, "loss": 1.1667, "step": 6708 }, { "epoch": 0.2, "learning_rate": 4.621575265175122e-06, "loss": 1.0308, "step": 6709 }, { "epoch": 0.2, "learning_rate": 4.62144622461245e-06, "loss": 1.1331, "step": 6710 }, { "epoch": 0.2, "learning_rate": 4.6213171638546315e-06, "loss": 1.2186, "step": 6711 }, { "epoch": 0.2, "learning_rate": 4.621188082902895e-06, "loss": 1.1266, "step": 6712 }, { "epoch": 0.2, "learning_rate": 4.6210589817584704e-06, "loss": 1.0571, "step": 6713 }, { "epoch": 0.2, "learning_rate": 4.620929860422585e-06, "loss": 1.1523, "step": 6714 }, { "epoch": 0.2, "learning_rate": 4.6208007188964685e-06, "loss": 1.1729, "step": 6715 }, { "epoch": 0.2, "learning_rate": 4.620671557181352e-06, "loss": 1.0538, "step": 6716 }, { "epoch": 0.2, "learning_rate": 4.620542375278463e-06, "loss": 1.1679, "step": 6717 }, { "epoch": 0.2, "learning_rate": 4.620413173189031e-06, "loss": 1.0429, "step": 6718 }, { "epoch": 0.2, "learning_rate": 4.620283950914287e-06, "loss": 1.1013, "step": 6719 }, { "epoch": 0.2, "learning_rate": 4.620154708455462e-06, "loss": 1.1149, "step": 6720 }, { "epoch": 0.2, "learning_rate": 4.620025445813785e-06, "loss": 1.1693, "step": 6721 }, { "epoch": 0.2, "learning_rate": 4.619896162990487e-06, "loss": 1.1819, "step": 6722 }, { "epoch": 0.2, "learning_rate": 4.619766859986797e-06, "loss": 1.0968, "step": 6723 }, { "epoch": 0.2, "learning_rate": 4.619637536803949e-06, "loss": 1.1539, "step": 6724 }, { "epoch": 0.2, "learning_rate": 4.619508193443172e-06, "loss": 1.1703, "step": 6725 }, { "epoch": 0.2, "learning_rate": 4.619378829905698e-06, "loss": 1.1324, "step": 6726 }, { "epoch": 0.2, "learning_rate": 4.619249446192758e-06, "loss": 1.2416, "step": 6727 }, { "epoch": 0.2, "learning_rate": 4.619120042305584e-06, "loss": 1.1166, "step": 6728 }, { "epoch": 0.2, "learning_rate": 4.618990618245407e-06, "loss": 1.1979, "step": 6729 }, { "epoch": 0.2, "learning_rate": 4.618861174013462e-06, "loss": 1.2772, "step": 6730 }, { "epoch": 0.2, "learning_rate": 4.618731709610977e-06, "loss": 1.3169, "step": 6731 }, { "epoch": 0.2, "learning_rate": 4.618602225039187e-06, "loss": 1.1354, "step": 6732 }, { "epoch": 0.2, "learning_rate": 4.6184727202993246e-06, "loss": 1.1248, "step": 6733 }, { "epoch": 0.2, "learning_rate": 4.618343195392621e-06, "loss": 1.2361, "step": 6734 }, { "epoch": 0.2, "learning_rate": 4.6182136503203126e-06, "loss": 1.2935, "step": 6735 }, { "epoch": 0.2, "learning_rate": 4.618084085083629e-06, "loss": 1.2274, "step": 6736 }, { "epoch": 0.2, "learning_rate": 4.617954499683805e-06, "loss": 1.267, "step": 6737 }, { "epoch": 0.2, "learning_rate": 4.617824894122075e-06, "loss": 1.183, "step": 6738 }, { "epoch": 0.2, "learning_rate": 4.617695268399671e-06, "loss": 1.1749, "step": 6739 }, { "epoch": 0.2, "learning_rate": 4.617565622517829e-06, "loss": 1.1033, "step": 6740 }, { "epoch": 0.2, "learning_rate": 4.617435956477781e-06, "loss": 1.1224, "step": 6741 }, { "epoch": 0.2, "learning_rate": 4.617306270280763e-06, "loss": 1.1791, "step": 6742 }, { "epoch": 0.2, "learning_rate": 4.6171765639280095e-06, "loss": 1.1437, "step": 6743 }, { "epoch": 0.2, "learning_rate": 4.617046837420755e-06, "loss": 1.1282, "step": 6744 }, { "epoch": 0.2, "learning_rate": 4.616917090760232e-06, "loss": 1.1745, "step": 6745 }, { "epoch": 0.2, "learning_rate": 4.61678732394768e-06, "loss": 1.1023, "step": 6746 }, { "epoch": 0.2, "learning_rate": 4.616657536984331e-06, "loss": 1.1193, "step": 6747 }, { "epoch": 0.2, "learning_rate": 4.616527729871423e-06, "loss": 1.3279, "step": 6748 }, { "epoch": 0.2, "learning_rate": 4.61639790261019e-06, "loss": 1.2006, "step": 6749 }, { "epoch": 0.2, "learning_rate": 4.6162680552018674e-06, "loss": 1.2841, "step": 6750 }, { "epoch": 0.2, "learning_rate": 4.6161381876476925e-06, "loss": 1.0848, "step": 6751 }, { "epoch": 0.2, "learning_rate": 4.6160082999489014e-06, "loss": 1.1678, "step": 6752 }, { "epoch": 0.2, "learning_rate": 4.61587839210673e-06, "loss": 1.1088, "step": 6753 }, { "epoch": 0.2, "learning_rate": 4.615748464122416e-06, "loss": 1.1514, "step": 6754 }, { "epoch": 0.2, "learning_rate": 4.615618515997196e-06, "loss": 1.1161, "step": 6755 }, { "epoch": 0.2, "learning_rate": 4.615488547732305e-06, "loss": 1.2732, "step": 6756 }, { "epoch": 0.2, "learning_rate": 4.6153585593289825e-06, "loss": 1.0648, "step": 6757 }, { "epoch": 0.2, "learning_rate": 4.615228550788466e-06, "loss": 1.2557, "step": 6758 }, { "epoch": 0.2, "learning_rate": 4.615098522111992e-06, "loss": 1.167, "step": 6759 }, { "epoch": 0.2, "learning_rate": 4.6149684733007985e-06, "loss": 1.1243, "step": 6760 }, { "epoch": 0.2, "learning_rate": 4.614838404356124e-06, "loss": 1.0861, "step": 6761 }, { "epoch": 0.2, "learning_rate": 4.6147083152792064e-06, "loss": 1.1375, "step": 6762 }, { "epoch": 0.2, "learning_rate": 4.614578206071284e-06, "loss": 1.1458, "step": 6763 }, { "epoch": 0.2, "learning_rate": 4.6144480767335955e-06, "loss": 1.1053, "step": 6764 }, { "epoch": 0.2, "learning_rate": 4.61431792726738e-06, "loss": 1.0768, "step": 6765 }, { "epoch": 0.2, "learning_rate": 4.614187757673876e-06, "loss": 1.2261, "step": 6766 }, { "epoch": 0.2, "learning_rate": 4.614057567954323e-06, "loss": 1.1862, "step": 6767 }, { "epoch": 0.2, "learning_rate": 4.61392735810996e-06, "loss": 1.1287, "step": 6768 }, { "epoch": 0.2, "learning_rate": 4.613797128142026e-06, "loss": 1.2103, "step": 6769 }, { "epoch": 0.2, "learning_rate": 4.613666878051762e-06, "loss": 1.1317, "step": 6770 }, { "epoch": 0.2, "learning_rate": 4.613536607840406e-06, "loss": 1.0903, "step": 6771 }, { "epoch": 0.2, "learning_rate": 4.613406317509201e-06, "loss": 1.0356, "step": 6772 }, { "epoch": 0.2, "learning_rate": 4.613276007059386e-06, "loss": 1.1151, "step": 6773 }, { "epoch": 0.2, "learning_rate": 4.6131456764922e-06, "loss": 1.139, "step": 6774 }, { "epoch": 0.2, "learning_rate": 4.613015325808885e-06, "loss": 1.1478, "step": 6775 }, { "epoch": 0.2, "learning_rate": 4.612884955010683e-06, "loss": 1.0902, "step": 6776 }, { "epoch": 0.2, "learning_rate": 4.612754564098833e-06, "loss": 1.0364, "step": 6777 }, { "epoch": 0.2, "learning_rate": 4.6126241530745765e-06, "loss": 1.1536, "step": 6778 }, { "epoch": 0.2, "learning_rate": 4.612493721939156e-06, "loss": 1.1719, "step": 6779 }, { "epoch": 0.2, "learning_rate": 4.612363270693812e-06, "loss": 1.1097, "step": 6780 }, { "epoch": 0.2, "learning_rate": 4.612232799339789e-06, "loss": 1.1168, "step": 6781 }, { "epoch": 0.2, "learning_rate": 4.612102307878325e-06, "loss": 1.1505, "step": 6782 }, { "epoch": 0.2, "learning_rate": 4.611971796310665e-06, "loss": 1.1444, "step": 6783 }, { "epoch": 0.2, "learning_rate": 4.6118412646380515e-06, "loss": 1.0792, "step": 6784 }, { "epoch": 0.2, "learning_rate": 4.611710712861725e-06, "loss": 1.1011, "step": 6785 }, { "epoch": 0.2, "learning_rate": 4.61158014098293e-06, "loss": 1.1512, "step": 6786 }, { "epoch": 0.2, "learning_rate": 4.611449549002908e-06, "loss": 1.1867, "step": 6787 }, { "epoch": 0.2, "learning_rate": 4.611318936922905e-06, "loss": 1.0588, "step": 6788 }, { "epoch": 0.2, "learning_rate": 4.6111883047441616e-06, "loss": 1.1316, "step": 6789 }, { "epoch": 0.2, "learning_rate": 4.611057652467923e-06, "loss": 1.1146, "step": 6790 }, { "epoch": 0.2, "learning_rate": 4.610926980095431e-06, "loss": 1.1134, "step": 6791 }, { "epoch": 0.2, "learning_rate": 4.610796287627932e-06, "loss": 1.1244, "step": 6792 }, { "epoch": 0.2, "learning_rate": 4.610665575066668e-06, "loss": 1.1281, "step": 6793 }, { "epoch": 0.2, "learning_rate": 4.610534842412886e-06, "loss": 1.0919, "step": 6794 }, { "epoch": 0.2, "learning_rate": 4.610404089667827e-06, "loss": 1.1606, "step": 6795 }, { "epoch": 0.2, "learning_rate": 4.610273316832738e-06, "loss": 1.185, "step": 6796 }, { "epoch": 0.2, "learning_rate": 4.610142523908864e-06, "loss": 1.0132, "step": 6797 }, { "epoch": 0.2, "learning_rate": 4.610011710897449e-06, "loss": 1.1917, "step": 6798 }, { "epoch": 0.2, "learning_rate": 4.609880877799738e-06, "loss": 1.2404, "step": 6799 }, { "epoch": 0.2, "learning_rate": 4.609750024616978e-06, "loss": 1.1797, "step": 6800 }, { "epoch": 0.2, "learning_rate": 4.609619151350414e-06, "loss": 1.1564, "step": 6801 }, { "epoch": 0.2, "learning_rate": 4.609488258001291e-06, "loss": 1.1041, "step": 6802 }, { "epoch": 0.2, "learning_rate": 4.609357344570856e-06, "loss": 1.1194, "step": 6803 }, { "epoch": 0.2, "learning_rate": 4.6092264110603545e-06, "loss": 1.2216, "step": 6804 }, { "epoch": 0.21, "learning_rate": 4.609095457471035e-06, "loss": 1.2285, "step": 6805 }, { "epoch": 0.21, "learning_rate": 4.608964483804141e-06, "loss": 1.2234, "step": 6806 }, { "epoch": 0.21, "learning_rate": 4.608833490060921e-06, "loss": 1.18, "step": 6807 }, { "epoch": 0.21, "learning_rate": 4.608702476242622e-06, "loss": 1.1864, "step": 6808 }, { "epoch": 0.21, "learning_rate": 4.608571442350491e-06, "loss": 1.1804, "step": 6809 }, { "epoch": 0.21, "learning_rate": 4.608440388385776e-06, "loss": 1.1716, "step": 6810 }, { "epoch": 0.21, "learning_rate": 4.608309314349724e-06, "loss": 1.1943, "step": 6811 }, { "epoch": 0.21, "learning_rate": 4.608178220243582e-06, "loss": 1.2548, "step": 6812 }, { "epoch": 0.21, "learning_rate": 4.608047106068598e-06, "loss": 1.1497, "step": 6813 }, { "epoch": 0.21, "learning_rate": 4.607915971826022e-06, "loss": 1.1098, "step": 6814 }, { "epoch": 0.21, "learning_rate": 4.607784817517101e-06, "loss": 1.1636, "step": 6815 }, { "epoch": 0.21, "learning_rate": 4.607653643143084e-06, "loss": 1.1234, "step": 6816 }, { "epoch": 0.21, "learning_rate": 4.607522448705218e-06, "loss": 1.1091, "step": 6817 }, { "epoch": 0.21, "learning_rate": 4.607391234204755e-06, "loss": 0.9704, "step": 6818 }, { "epoch": 0.21, "learning_rate": 4.607259999642941e-06, "loss": 1.2643, "step": 6819 }, { "epoch": 0.21, "learning_rate": 4.6071287450210275e-06, "loss": 1.1595, "step": 6820 }, { "epoch": 0.21, "learning_rate": 4.606997470340263e-06, "loss": 1.1411, "step": 6821 }, { "epoch": 0.21, "learning_rate": 4.606866175601898e-06, "loss": 1.223, "step": 6822 }, { "epoch": 0.21, "learning_rate": 4.606734860807181e-06, "loss": 1.0151, "step": 6823 }, { "epoch": 0.21, "learning_rate": 4.6066035259573624e-06, "loss": 1.0328, "step": 6824 }, { "epoch": 0.21, "learning_rate": 4.606472171053693e-06, "loss": 1.2269, "step": 6825 }, { "epoch": 0.21, "learning_rate": 4.606340796097424e-06, "loss": 1.1561, "step": 6826 }, { "epoch": 0.21, "learning_rate": 4.606209401089804e-06, "loss": 1.1523, "step": 6827 }, { "epoch": 0.21, "learning_rate": 4.606077986032086e-06, "loss": 1.0871, "step": 6828 }, { "epoch": 0.21, "learning_rate": 4.605946550925519e-06, "loss": 1.1359, "step": 6829 }, { "epoch": 0.21, "learning_rate": 4.605815095771355e-06, "loss": 1.249, "step": 6830 }, { "epoch": 0.21, "learning_rate": 4.605683620570845e-06, "loss": 1.1151, "step": 6831 }, { "epoch": 0.21, "learning_rate": 4.605552125325242e-06, "loss": 1.2499, "step": 6832 }, { "epoch": 0.21, "learning_rate": 4.605420610035797e-06, "loss": 1.0777, "step": 6833 }, { "epoch": 0.21, "learning_rate": 4.605289074703761e-06, "loss": 1.181, "step": 6834 }, { "epoch": 0.21, "learning_rate": 4.605157519330388e-06, "loss": 1.1635, "step": 6835 }, { "epoch": 0.21, "learning_rate": 4.605025943916929e-06, "loss": 1.1056, "step": 6836 }, { "epoch": 0.21, "learning_rate": 4.6048943484646365e-06, "loss": 1.0613, "step": 6837 }, { "epoch": 0.21, "learning_rate": 4.604762732974763e-06, "loss": 1.0573, "step": 6838 }, { "epoch": 0.21, "learning_rate": 4.604631097448563e-06, "loss": 1.1557, "step": 6839 }, { "epoch": 0.21, "learning_rate": 4.604499441887288e-06, "loss": 1.2069, "step": 6840 }, { "epoch": 0.21, "learning_rate": 4.604367766292191e-06, "loss": 1.1516, "step": 6841 }, { "epoch": 0.21, "learning_rate": 4.604236070664528e-06, "loss": 1.1467, "step": 6842 }, { "epoch": 0.21, "learning_rate": 4.604104355005551e-06, "loss": 1.2083, "step": 6843 }, { "epoch": 0.21, "learning_rate": 4.603972619316513e-06, "loss": 1.3035, "step": 6844 }, { "epoch": 0.21, "learning_rate": 4.603840863598669e-06, "loss": 1.1316, "step": 6845 }, { "epoch": 0.21, "learning_rate": 4.603709087853274e-06, "loss": 1.1932, "step": 6846 }, { "epoch": 0.21, "learning_rate": 4.603577292081582e-06, "loss": 1.0573, "step": 6847 }, { "epoch": 0.21, "learning_rate": 4.603445476284845e-06, "loss": 1.1103, "step": 6848 }, { "epoch": 0.21, "learning_rate": 4.603313640464322e-06, "loss": 1.0559, "step": 6849 }, { "epoch": 0.21, "learning_rate": 4.603181784621266e-06, "loss": 1.1301, "step": 6850 }, { "epoch": 0.21, "learning_rate": 4.6030499087569315e-06, "loss": 1.1162, "step": 6851 }, { "epoch": 0.21, "learning_rate": 4.602918012872576e-06, "loss": 1.1002, "step": 6852 }, { "epoch": 0.21, "learning_rate": 4.602786096969453e-06, "loss": 1.1799, "step": 6853 }, { "epoch": 0.21, "learning_rate": 4.602654161048819e-06, "loss": 1.1111, "step": 6854 }, { "epoch": 0.21, "learning_rate": 4.60252220511193e-06, "loss": 1.2352, "step": 6855 }, { "epoch": 0.21, "learning_rate": 4.602390229160043e-06, "loss": 1.0691, "step": 6856 }, { "epoch": 0.21, "learning_rate": 4.602258233194413e-06, "loss": 1.1884, "step": 6857 }, { "epoch": 0.21, "learning_rate": 4.602126217216297e-06, "loss": 1.1576, "step": 6858 }, { "epoch": 0.21, "learning_rate": 4.601994181226952e-06, "loss": 1.1134, "step": 6859 }, { "epoch": 0.21, "learning_rate": 4.601862125227634e-06, "loss": 1.153, "step": 6860 }, { "epoch": 0.21, "learning_rate": 4.601730049219602e-06, "loss": 1.1226, "step": 6861 }, { "epoch": 0.21, "learning_rate": 4.601597953204112e-06, "loss": 1.0668, "step": 6862 }, { "epoch": 0.21, "learning_rate": 4.601465837182421e-06, "loss": 1.2543, "step": 6863 }, { "epoch": 0.21, "learning_rate": 4.601333701155788e-06, "loss": 1.1852, "step": 6864 }, { "epoch": 0.21, "learning_rate": 4.60120154512547e-06, "loss": 1.0687, "step": 6865 }, { "epoch": 0.21, "learning_rate": 4.601069369092725e-06, "loss": 1.3774, "step": 6866 }, { "epoch": 0.21, "learning_rate": 4.6009371730588115e-06, "loss": 1.202, "step": 6867 }, { "epoch": 0.21, "learning_rate": 4.600804957024988e-06, "loss": 1.155, "step": 6868 }, { "epoch": 0.21, "learning_rate": 4.600672720992514e-06, "loss": 1.1752, "step": 6869 }, { "epoch": 0.21, "learning_rate": 4.600540464962646e-06, "loss": 1.1562, "step": 6870 }, { "epoch": 0.21, "learning_rate": 4.600408188936645e-06, "loss": 1.0698, "step": 6871 }, { "epoch": 0.21, "learning_rate": 4.60027589291577e-06, "loss": 1.172, "step": 6872 }, { "epoch": 0.21, "learning_rate": 4.600143576901279e-06, "loss": 1.2339, "step": 6873 }, { "epoch": 0.21, "learning_rate": 4.600011240894434e-06, "loss": 1.1828, "step": 6874 }, { "epoch": 0.21, "learning_rate": 4.599878884896493e-06, "loss": 1.1772, "step": 6875 }, { "epoch": 0.21, "learning_rate": 4.5997465089087155e-06, "loss": 1.1632, "step": 6876 }, { "epoch": 0.21, "learning_rate": 4.599614112932363e-06, "loss": 0.9822, "step": 6877 }, { "epoch": 0.21, "learning_rate": 4.599481696968696e-06, "loss": 1.0499, "step": 6878 }, { "epoch": 0.21, "learning_rate": 4.5993492610189736e-06, "loss": 1.1164, "step": 6879 }, { "epoch": 0.21, "learning_rate": 4.5992168050844575e-06, "loss": 1.0394, "step": 6880 }, { "epoch": 0.21, "learning_rate": 4.599084329166409e-06, "loss": 1.0126, "step": 6881 }, { "epoch": 0.21, "learning_rate": 4.598951833266087e-06, "loss": 1.1019, "step": 6882 }, { "epoch": 0.21, "learning_rate": 4.598819317384757e-06, "loss": 1.0317, "step": 6883 }, { "epoch": 0.21, "learning_rate": 4.5986867815236755e-06, "loss": 1.1071, "step": 6884 }, { "epoch": 0.21, "learning_rate": 4.5985542256841085e-06, "loss": 1.1033, "step": 6885 }, { "epoch": 0.21, "learning_rate": 4.598421649867315e-06, "loss": 1.2506, "step": 6886 }, { "epoch": 0.21, "learning_rate": 4.5982890540745575e-06, "loss": 1.1734, "step": 6887 }, { "epoch": 0.21, "learning_rate": 4.5981564383070994e-06, "loss": 1.1413, "step": 6888 }, { "epoch": 0.21, "learning_rate": 4.598023802566203e-06, "loss": 1.2546, "step": 6889 }, { "epoch": 0.21, "learning_rate": 4.597891146853129e-06, "loss": 1.1342, "step": 6890 }, { "epoch": 0.21, "learning_rate": 4.597758471169143e-06, "loss": 1.1249, "step": 6891 }, { "epoch": 0.21, "learning_rate": 4.597625775515507e-06, "loss": 1.0865, "step": 6892 }, { "epoch": 0.21, "learning_rate": 4.597493059893483e-06, "loss": 1.1318, "step": 6893 }, { "epoch": 0.21, "learning_rate": 4.5973603243043354e-06, "loss": 1.0582, "step": 6894 }, { "epoch": 0.21, "learning_rate": 4.5972275687493275e-06, "loss": 1.1522, "step": 6895 }, { "epoch": 0.21, "learning_rate": 4.5970947932297234e-06, "loss": 1.0773, "step": 6896 }, { "epoch": 0.21, "learning_rate": 4.596961997746787e-06, "loss": 1.098, "step": 6897 }, { "epoch": 0.21, "learning_rate": 4.596829182301782e-06, "loss": 1.2234, "step": 6898 }, { "epoch": 0.21, "learning_rate": 4.596696346895973e-06, "loss": 1.2892, "step": 6899 }, { "epoch": 0.21, "learning_rate": 4.596563491530625e-06, "loss": 1.1631, "step": 6900 }, { "epoch": 0.21, "learning_rate": 4.596430616207002e-06, "loss": 1.1129, "step": 6901 }, { "epoch": 0.21, "learning_rate": 4.596297720926369e-06, "loss": 1.1336, "step": 6902 }, { "epoch": 0.21, "learning_rate": 4.596164805689992e-06, "loss": 1.1698, "step": 6903 }, { "epoch": 0.21, "learning_rate": 4.596031870499135e-06, "loss": 1.0833, "step": 6904 }, { "epoch": 0.21, "learning_rate": 4.595898915355063e-06, "loss": 1.2063, "step": 6905 }, { "epoch": 0.21, "learning_rate": 4.5957659402590445e-06, "loss": 1.1445, "step": 6906 }, { "epoch": 0.21, "learning_rate": 4.595632945212344e-06, "loss": 1.1257, "step": 6907 }, { "epoch": 0.21, "learning_rate": 4.595499930216225e-06, "loss": 1.0881, "step": 6908 }, { "epoch": 0.21, "learning_rate": 4.595366895271958e-06, "loss": 1.1647, "step": 6909 }, { "epoch": 0.21, "learning_rate": 4.595233840380806e-06, "loss": 1.2117, "step": 6910 }, { "epoch": 0.21, "learning_rate": 4.595100765544038e-06, "loss": 1.1699, "step": 6911 }, { "epoch": 0.21, "learning_rate": 4.594967670762919e-06, "loss": 1.0435, "step": 6912 }, { "epoch": 0.21, "learning_rate": 4.594834556038717e-06, "loss": 1.2332, "step": 6913 }, { "epoch": 0.21, "learning_rate": 4.594701421372699e-06, "loss": 1.1821, "step": 6914 }, { "epoch": 0.21, "learning_rate": 4.594568266766132e-06, "loss": 1.219, "step": 6915 }, { "epoch": 0.21, "learning_rate": 4.594435092220284e-06, "loss": 1.1984, "step": 6916 }, { "epoch": 0.21, "learning_rate": 4.594301897736422e-06, "loss": 1.1536, "step": 6917 }, { "epoch": 0.21, "learning_rate": 4.594168683315815e-06, "loss": 1.2084, "step": 6918 }, { "epoch": 0.21, "learning_rate": 4.594035448959732e-06, "loss": 1.1611, "step": 6919 }, { "epoch": 0.21, "learning_rate": 4.593902194669438e-06, "loss": 1.0168, "step": 6920 }, { "epoch": 0.21, "learning_rate": 4.593768920446205e-06, "loss": 1.1395, "step": 6921 }, { "epoch": 0.21, "learning_rate": 4.5936356262912995e-06, "loss": 1.2681, "step": 6922 }, { "epoch": 0.21, "learning_rate": 4.593502312205992e-06, "loss": 1.079, "step": 6923 }, { "epoch": 0.21, "learning_rate": 4.59336897819155e-06, "loss": 1.1248, "step": 6924 }, { "epoch": 0.21, "learning_rate": 4.593235624249244e-06, "loss": 1.0909, "step": 6925 }, { "epoch": 0.21, "learning_rate": 4.593102250380343e-06, "loss": 1.2071, "step": 6926 }, { "epoch": 0.21, "learning_rate": 4.592968856586117e-06, "loss": 1.1368, "step": 6927 }, { "epoch": 0.21, "learning_rate": 4.592835442867834e-06, "loss": 1.1932, "step": 6928 }, { "epoch": 0.21, "learning_rate": 4.592702009226767e-06, "loss": 1.108, "step": 6929 }, { "epoch": 0.21, "learning_rate": 4.592568555664183e-06, "loss": 1.1785, "step": 6930 }, { "epoch": 0.21, "learning_rate": 4.592435082181356e-06, "loss": 1.1804, "step": 6931 }, { "epoch": 0.21, "learning_rate": 4.592301588779554e-06, "loss": 1.1296, "step": 6932 }, { "epoch": 0.21, "learning_rate": 4.592168075460049e-06, "loss": 1.1477, "step": 6933 }, { "epoch": 0.21, "learning_rate": 4.592034542224112e-06, "loss": 1.0563, "step": 6934 }, { "epoch": 0.21, "learning_rate": 4.591900989073012e-06, "loss": 1.3455, "step": 6935 }, { "epoch": 0.21, "learning_rate": 4.5917674160080224e-06, "loss": 1.286, "step": 6936 }, { "epoch": 0.21, "learning_rate": 4.591633823030416e-06, "loss": 1.2726, "step": 6937 }, { "epoch": 0.21, "learning_rate": 4.591500210141462e-06, "loss": 1.2103, "step": 6938 }, { "epoch": 0.21, "learning_rate": 4.591366577342433e-06, "loss": 1.1364, "step": 6939 }, { "epoch": 0.21, "learning_rate": 4.591232924634602e-06, "loss": 1.1345, "step": 6940 }, { "epoch": 0.21, "learning_rate": 4.5910992520192406e-06, "loss": 1.187, "step": 6941 }, { "epoch": 0.21, "learning_rate": 4.590965559497621e-06, "loss": 1.1286, "step": 6942 }, { "epoch": 0.21, "learning_rate": 4.590831847071017e-06, "loss": 1.1589, "step": 6943 }, { "epoch": 0.21, "learning_rate": 4.5906981147407e-06, "loss": 1.2111, "step": 6944 }, { "epoch": 0.21, "learning_rate": 4.590564362507944e-06, "loss": 1.0958, "step": 6945 }, { "epoch": 0.21, "learning_rate": 4.590430590374023e-06, "loss": 1.1509, "step": 6946 }, { "epoch": 0.21, "learning_rate": 4.5902967983402095e-06, "loss": 1.0274, "step": 6947 }, { "epoch": 0.21, "learning_rate": 4.590162986407776e-06, "loss": 1.2146, "step": 6948 }, { "epoch": 0.21, "learning_rate": 4.590029154577998e-06, "loss": 1.1598, "step": 6949 }, { "epoch": 0.21, "learning_rate": 4.58989530285215e-06, "loss": 1.1733, "step": 6950 }, { "epoch": 0.21, "learning_rate": 4.589761431231504e-06, "loss": 1.08, "step": 6951 }, { "epoch": 0.21, "learning_rate": 4.589627539717336e-06, "loss": 1.1011, "step": 6952 }, { "epoch": 0.21, "learning_rate": 4.58949362831092e-06, "loss": 1.0713, "step": 6953 }, { "epoch": 0.21, "learning_rate": 4.589359697013532e-06, "loss": 1.1114, "step": 6954 }, { "epoch": 0.21, "learning_rate": 4.589225745826445e-06, "loss": 1.1815, "step": 6955 }, { "epoch": 0.21, "learning_rate": 4.589091774750935e-06, "loss": 1.1456, "step": 6956 }, { "epoch": 0.21, "learning_rate": 4.588957783788278e-06, "loss": 1.2479, "step": 6957 }, { "epoch": 0.21, "learning_rate": 4.588823772939749e-06, "loss": 1.1597, "step": 6958 }, { "epoch": 0.21, "learning_rate": 4.588689742206624e-06, "loss": 1.0959, "step": 6959 }, { "epoch": 0.21, "learning_rate": 4.588555691590178e-06, "loss": 1.1526, "step": 6960 }, { "epoch": 0.21, "learning_rate": 4.5884216210916875e-06, "loss": 1.1982, "step": 6961 }, { "epoch": 0.21, "learning_rate": 4.588287530712429e-06, "loss": 1.0609, "step": 6962 }, { "epoch": 0.21, "learning_rate": 4.588153420453679e-06, "loss": 1.1369, "step": 6963 }, { "epoch": 0.21, "learning_rate": 4.588019290316715e-06, "loss": 1.1987, "step": 6964 }, { "epoch": 0.21, "learning_rate": 4.587885140302812e-06, "loss": 0.9916, "step": 6965 }, { "epoch": 0.21, "learning_rate": 4.587750970413249e-06, "loss": 1.0257, "step": 6966 }, { "epoch": 0.21, "learning_rate": 4.587616780649302e-06, "loss": 1.1688, "step": 6967 }, { "epoch": 0.21, "learning_rate": 4.587482571012248e-06, "loss": 1.2108, "step": 6968 }, { "epoch": 0.21, "learning_rate": 4.5873483415033654e-06, "loss": 1.0898, "step": 6969 }, { "epoch": 0.21, "learning_rate": 4.587214092123932e-06, "loss": 1.0698, "step": 6970 }, { "epoch": 0.21, "learning_rate": 4.587079822875226e-06, "loss": 1.0752, "step": 6971 }, { "epoch": 0.21, "learning_rate": 4.586945533758525e-06, "loss": 1.2004, "step": 6972 }, { "epoch": 0.21, "learning_rate": 4.586811224775107e-06, "loss": 1.2524, "step": 6973 }, { "epoch": 0.21, "learning_rate": 4.586676895926253e-06, "loss": 1.2266, "step": 6974 }, { "epoch": 0.21, "learning_rate": 4.586542547213238e-06, "loss": 1.1, "step": 6975 }, { "epoch": 0.21, "learning_rate": 4.586408178637344e-06, "loss": 1.1616, "step": 6976 }, { "epoch": 0.21, "learning_rate": 4.5862737901998486e-06, "loss": 1.1777, "step": 6977 }, { "epoch": 0.21, "learning_rate": 4.586139381902031e-06, "loss": 1.1569, "step": 6978 }, { "epoch": 0.21, "learning_rate": 4.5860049537451724e-06, "loss": 1.0767, "step": 6979 }, { "epoch": 0.21, "learning_rate": 4.585870505730551e-06, "loss": 1.1969, "step": 6980 }, { "epoch": 0.21, "learning_rate": 4.585736037859446e-06, "loss": 1.0548, "step": 6981 }, { "epoch": 0.21, "learning_rate": 4.585601550133139e-06, "loss": 1.2145, "step": 6982 }, { "epoch": 0.21, "learning_rate": 4.585467042552909e-06, "loss": 1.1945, "step": 6983 }, { "epoch": 0.21, "learning_rate": 4.585332515120039e-06, "loss": 1.0917, "step": 6984 }, { "epoch": 0.21, "learning_rate": 4.585197967835806e-06, "loss": 1.0983, "step": 6985 }, { "epoch": 0.21, "learning_rate": 4.585063400701494e-06, "loss": 1.0893, "step": 6986 }, { "epoch": 0.21, "learning_rate": 4.5849288137183815e-06, "loss": 1.2091, "step": 6987 }, { "epoch": 0.21, "learning_rate": 4.584794206887752e-06, "loss": 1.1747, "step": 6988 }, { "epoch": 0.21, "learning_rate": 4.584659580210884e-06, "loss": 1.0798, "step": 6989 }, { "epoch": 0.21, "learning_rate": 4.584524933689062e-06, "loss": 1.0912, "step": 6990 }, { "epoch": 0.21, "learning_rate": 4.584390267323567e-06, "loss": 1.0226, "step": 6991 }, { "epoch": 0.21, "learning_rate": 4.584255581115679e-06, "loss": 1.0294, "step": 6992 }, { "epoch": 0.21, "learning_rate": 4.584120875066683e-06, "loss": 1.2596, "step": 6993 }, { "epoch": 0.21, "learning_rate": 4.58398614917786e-06, "loss": 1.1785, "step": 6994 }, { "epoch": 0.21, "learning_rate": 4.583851403450492e-06, "loss": 1.1519, "step": 6995 }, { "epoch": 0.21, "learning_rate": 4.5837166378858626e-06, "loss": 1.1972, "step": 6996 }, { "epoch": 0.21, "learning_rate": 4.583581852485254e-06, "loss": 1.2296, "step": 6997 }, { "epoch": 0.21, "learning_rate": 4.583447047249949e-06, "loss": 1.2289, "step": 6998 }, { "epoch": 0.21, "learning_rate": 4.583312222181233e-06, "loss": 1.1908, "step": 6999 }, { "epoch": 0.21, "learning_rate": 4.583177377280387e-06, "loss": 1.2566, "step": 7000 }, { "epoch": 0.21, "learning_rate": 4.583042512548697e-06, "loss": 1.0394, "step": 7001 }, { "epoch": 0.21, "learning_rate": 4.582907627987444e-06, "loss": 1.1917, "step": 7002 }, { "epoch": 0.21, "learning_rate": 4.582772723597914e-06, "loss": 1.0591, "step": 7003 }, { "epoch": 0.21, "learning_rate": 4.5826377993813905e-06, "loss": 1.1523, "step": 7004 }, { "epoch": 0.21, "learning_rate": 4.582502855339158e-06, "loss": 1.157, "step": 7005 }, { "epoch": 0.21, "learning_rate": 4.582367891472502e-06, "loss": 1.1429, "step": 7006 }, { "epoch": 0.21, "learning_rate": 4.582232907782707e-06, "loss": 1.1132, "step": 7007 }, { "epoch": 0.21, "learning_rate": 4.582097904271057e-06, "loss": 1.2357, "step": 7008 }, { "epoch": 0.21, "learning_rate": 4.581962880938837e-06, "loss": 1.148, "step": 7009 }, { "epoch": 0.21, "learning_rate": 4.581827837787334e-06, "loss": 1.174, "step": 7010 }, { "epoch": 0.21, "learning_rate": 4.581692774817832e-06, "loss": 1.1299, "step": 7011 }, { "epoch": 0.21, "learning_rate": 4.581557692031618e-06, "loss": 1.1422, "step": 7012 }, { "epoch": 0.21, "learning_rate": 4.581422589429977e-06, "loss": 1.1245, "step": 7013 }, { "epoch": 0.21, "learning_rate": 4.5812874670141955e-06, "loss": 1.1161, "step": 7014 }, { "epoch": 0.21, "learning_rate": 4.581152324785559e-06, "loss": 1.1815, "step": 7015 }, { "epoch": 0.21, "learning_rate": 4.581017162745356e-06, "loss": 1.1634, "step": 7016 }, { "epoch": 0.21, "learning_rate": 4.580881980894872e-06, "loss": 1.1254, "step": 7017 }, { "epoch": 0.21, "learning_rate": 4.580746779235392e-06, "loss": 1.2823, "step": 7018 }, { "epoch": 0.21, "learning_rate": 4.580611557768206e-06, "loss": 1.1447, "step": 7019 }, { "epoch": 0.21, "learning_rate": 4.580476316494599e-06, "loss": 1.0311, "step": 7020 }, { "epoch": 0.21, "learning_rate": 4.58034105541586e-06, "loss": 1.2114, "step": 7021 }, { "epoch": 0.21, "learning_rate": 4.5802057745332765e-06, "loss": 1.1229, "step": 7022 }, { "epoch": 0.21, "learning_rate": 4.580070473848135e-06, "loss": 1.1299, "step": 7023 }, { "epoch": 0.21, "learning_rate": 4.579935153361725e-06, "loss": 1.1317, "step": 7024 }, { "epoch": 0.21, "learning_rate": 4.579799813075335e-06, "loss": 1.1465, "step": 7025 }, { "epoch": 0.21, "learning_rate": 4.579664452990252e-06, "loss": 1.1667, "step": 7026 }, { "epoch": 0.21, "learning_rate": 4.579529073107764e-06, "loss": 1.1727, "step": 7027 }, { "epoch": 0.21, "learning_rate": 4.579393673429161e-06, "loss": 1.1462, "step": 7028 }, { "epoch": 0.21, "learning_rate": 4.579258253955731e-06, "loss": 1.0958, "step": 7029 }, { "epoch": 0.21, "learning_rate": 4.5791228146887656e-06, "loss": 1.12, "step": 7030 }, { "epoch": 0.21, "learning_rate": 4.578987355629552e-06, "loss": 1.2008, "step": 7031 }, { "epoch": 0.21, "learning_rate": 4.5788518767793786e-06, "loss": 1.0227, "step": 7032 }, { "epoch": 0.21, "learning_rate": 4.578716378139538e-06, "loss": 1.1498, "step": 7033 }, { "epoch": 0.21, "learning_rate": 4.578580859711318e-06, "loss": 0.985, "step": 7034 }, { "epoch": 0.21, "learning_rate": 4.57844532149601e-06, "loss": 1.1329, "step": 7035 }, { "epoch": 0.21, "learning_rate": 4.5783097634949025e-06, "loss": 1.1768, "step": 7036 }, { "epoch": 0.21, "learning_rate": 4.578174185709288e-06, "loss": 1.2235, "step": 7037 }, { "epoch": 0.21, "learning_rate": 4.578038588140456e-06, "loss": 1.1591, "step": 7038 }, { "epoch": 0.21, "learning_rate": 4.577902970789696e-06, "loss": 1.2642, "step": 7039 }, { "epoch": 0.21, "learning_rate": 4.577767333658302e-06, "loss": 1.0752, "step": 7040 }, { "epoch": 0.21, "learning_rate": 4.5776316767475635e-06, "loss": 1.1949, "step": 7041 }, { "epoch": 0.21, "learning_rate": 4.577496000058771e-06, "loss": 1.2086, "step": 7042 }, { "epoch": 0.21, "learning_rate": 4.577360303593219e-06, "loss": 1.0393, "step": 7043 }, { "epoch": 0.21, "learning_rate": 4.577224587352196e-06, "loss": 1.0892, "step": 7044 }, { "epoch": 0.21, "learning_rate": 4.5770888513369955e-06, "loss": 1.149, "step": 7045 }, { "epoch": 0.21, "learning_rate": 4.57695309554891e-06, "loss": 1.2264, "step": 7046 }, { "epoch": 0.21, "learning_rate": 4.576817319989231e-06, "loss": 1.1279, "step": 7047 }, { "epoch": 0.21, "learning_rate": 4.576681524659251e-06, "loss": 1.0409, "step": 7048 }, { "epoch": 0.21, "learning_rate": 4.576545709560264e-06, "loss": 1.1503, "step": 7049 }, { "epoch": 0.21, "learning_rate": 4.576409874693561e-06, "loss": 1.1589, "step": 7050 }, { "epoch": 0.21, "learning_rate": 4.576274020060436e-06, "loss": 1.1164, "step": 7051 }, { "epoch": 0.21, "learning_rate": 4.576138145662183e-06, "loss": 1.1345, "step": 7052 }, { "epoch": 0.21, "learning_rate": 4.576002251500095e-06, "loss": 1.1198, "step": 7053 }, { "epoch": 0.21, "learning_rate": 4.575866337575464e-06, "loss": 1.066, "step": 7054 }, { "epoch": 0.21, "learning_rate": 4.575730403889586e-06, "loss": 1.0543, "step": 7055 }, { "epoch": 0.21, "learning_rate": 4.5755944504437545e-06, "loss": 1.1301, "step": 7056 }, { "epoch": 0.21, "learning_rate": 4.575458477239263e-06, "loss": 1.0657, "step": 7057 }, { "epoch": 0.21, "learning_rate": 4.5753224842774066e-06, "loss": 1.1651, "step": 7058 }, { "epoch": 0.21, "learning_rate": 4.57518647155948e-06, "loss": 1.1147, "step": 7059 }, { "epoch": 0.21, "learning_rate": 4.575050439086778e-06, "loss": 1.1327, "step": 7060 }, { "epoch": 0.21, "learning_rate": 4.574914386860594e-06, "loss": 1.1474, "step": 7061 }, { "epoch": 0.21, "learning_rate": 4.574778314882225e-06, "loss": 1.1183, "step": 7062 }, { "epoch": 0.21, "learning_rate": 4.5746422231529654e-06, "loss": 1.2057, "step": 7063 }, { "epoch": 0.21, "learning_rate": 4.574506111674111e-06, "loss": 1.1055, "step": 7064 }, { "epoch": 0.21, "learning_rate": 4.574369980446958e-06, "loss": 0.9849, "step": 7065 }, { "epoch": 0.21, "learning_rate": 4.574233829472802e-06, "loss": 1.156, "step": 7066 }, { "epoch": 0.21, "learning_rate": 4.574097658752938e-06, "loss": 1.078, "step": 7067 }, { "epoch": 0.21, "learning_rate": 4.573961468288664e-06, "loss": 1.1691, "step": 7068 }, { "epoch": 0.21, "learning_rate": 4.5738252580812754e-06, "loss": 1.197, "step": 7069 }, { "epoch": 0.21, "learning_rate": 4.573689028132069e-06, "loss": 1.1755, "step": 7070 }, { "epoch": 0.21, "learning_rate": 4.573552778442342e-06, "loss": 1.1833, "step": 7071 }, { "epoch": 0.21, "learning_rate": 4.5734165090133905e-06, "loss": 0.9973, "step": 7072 }, { "epoch": 0.21, "learning_rate": 4.573280219846514e-06, "loss": 1.1624, "step": 7073 }, { "epoch": 0.21, "learning_rate": 4.5731439109430074e-06, "loss": 1.2397, "step": 7074 }, { "epoch": 0.21, "learning_rate": 4.5730075823041685e-06, "loss": 1.0654, "step": 7075 }, { "epoch": 0.21, "learning_rate": 4.572871233931297e-06, "loss": 1.1193, "step": 7076 }, { "epoch": 0.21, "learning_rate": 4.572734865825689e-06, "loss": 1.202, "step": 7077 }, { "epoch": 0.21, "learning_rate": 4.572598477988644e-06, "loss": 1.0618, "step": 7078 }, { "epoch": 0.21, "learning_rate": 4.572462070421459e-06, "loss": 1.1824, "step": 7079 }, { "epoch": 0.21, "learning_rate": 4.572325643125433e-06, "loss": 1.2244, "step": 7080 }, { "epoch": 0.21, "learning_rate": 4.572189196101865e-06, "loss": 1.0788, "step": 7081 }, { "epoch": 0.21, "learning_rate": 4.572052729352055e-06, "loss": 1.1685, "step": 7082 }, { "epoch": 0.21, "learning_rate": 4.5719162428773005e-06, "loss": 1.175, "step": 7083 }, { "epoch": 0.21, "learning_rate": 4.5717797366789005e-06, "loss": 1.112, "step": 7084 }, { "epoch": 0.21, "learning_rate": 4.571643210758156e-06, "loss": 1.1193, "step": 7085 }, { "epoch": 0.21, "learning_rate": 4.5715066651163655e-06, "loss": 1.0555, "step": 7086 }, { "epoch": 0.21, "learning_rate": 4.571370099754829e-06, "loss": 1.1805, "step": 7087 }, { "epoch": 0.21, "learning_rate": 4.571233514674846e-06, "loss": 1.147, "step": 7088 }, { "epoch": 0.21, "learning_rate": 4.571096909877719e-06, "loss": 1.0204, "step": 7089 }, { "epoch": 0.21, "learning_rate": 4.5709602853647466e-06, "loss": 1.1893, "step": 7090 }, { "epoch": 0.21, "learning_rate": 4.5708236411372295e-06, "loss": 1.0517, "step": 7091 }, { "epoch": 0.21, "learning_rate": 4.570686977196468e-06, "loss": 1.1141, "step": 7092 }, { "epoch": 0.21, "learning_rate": 4.570550293543765e-06, "loss": 1.209, "step": 7093 }, { "epoch": 0.21, "learning_rate": 4.5704135901804196e-06, "loss": 1.1737, "step": 7094 }, { "epoch": 0.21, "learning_rate": 4.570276867107734e-06, "loss": 1.2625, "step": 7095 }, { "epoch": 0.21, "learning_rate": 4.5701401243270106e-06, "loss": 1.0331, "step": 7096 }, { "epoch": 0.21, "learning_rate": 4.570003361839549e-06, "loss": 1.2637, "step": 7097 }, { "epoch": 0.21, "learning_rate": 4.569866579646654e-06, "loss": 1.1418, "step": 7098 }, { "epoch": 0.21, "learning_rate": 4.569729777749624e-06, "loss": 1.2286, "step": 7099 }, { "epoch": 0.21, "learning_rate": 4.5695929561497644e-06, "loss": 1.1063, "step": 7100 }, { "epoch": 0.21, "learning_rate": 4.569456114848376e-06, "loss": 1.1829, "step": 7101 }, { "epoch": 0.21, "learning_rate": 4.569319253846763e-06, "loss": 1.1119, "step": 7102 }, { "epoch": 0.21, "learning_rate": 4.569182373146226e-06, "loss": 1.0613, "step": 7103 }, { "epoch": 0.21, "learning_rate": 4.56904547274807e-06, "loss": 1.3307, "step": 7104 }, { "epoch": 0.21, "learning_rate": 4.568908552653598e-06, "loss": 1.2074, "step": 7105 }, { "epoch": 0.21, "learning_rate": 4.5687716128641135e-06, "loss": 1.2242, "step": 7106 }, { "epoch": 0.21, "learning_rate": 4.568634653380919e-06, "loss": 1.1298, "step": 7107 }, { "epoch": 0.21, "learning_rate": 4.5684976742053185e-06, "loss": 1.1349, "step": 7108 }, { "epoch": 0.21, "learning_rate": 4.568360675338617e-06, "loss": 1.0401, "step": 7109 }, { "epoch": 0.21, "learning_rate": 4.568223656782117e-06, "loss": 1.1708, "step": 7110 }, { "epoch": 0.21, "learning_rate": 4.568086618537125e-06, "loss": 1.1875, "step": 7111 }, { "epoch": 0.21, "learning_rate": 4.567949560604944e-06, "loss": 1.0665, "step": 7112 }, { "epoch": 0.21, "learning_rate": 4.567812482986879e-06, "loss": 1.0731, "step": 7113 }, { "epoch": 0.21, "learning_rate": 4.567675385684235e-06, "loss": 1.2393, "step": 7114 }, { "epoch": 0.21, "learning_rate": 4.567538268698317e-06, "loss": 1.1445, "step": 7115 }, { "epoch": 0.21, "learning_rate": 4.567401132030431e-06, "loss": 1.2617, "step": 7116 }, { "epoch": 0.21, "learning_rate": 4.567263975681882e-06, "loss": 1.2302, "step": 7117 }, { "epoch": 0.21, "learning_rate": 4.567126799653975e-06, "loss": 1.2515, "step": 7118 }, { "epoch": 0.21, "learning_rate": 4.566989603948016e-06, "loss": 1.2134, "step": 7119 }, { "epoch": 0.21, "learning_rate": 4.566852388565312e-06, "loss": 1.1607, "step": 7120 }, { "epoch": 0.21, "learning_rate": 4.5667151535071695e-06, "loss": 1.1301, "step": 7121 }, { "epoch": 0.21, "learning_rate": 4.566577898774893e-06, "loss": 1.1207, "step": 7122 }, { "epoch": 0.21, "learning_rate": 4.566440624369791e-06, "loss": 1.1646, "step": 7123 }, { "epoch": 0.21, "learning_rate": 4.566303330293169e-06, "loss": 1.1885, "step": 7124 }, { "epoch": 0.21, "learning_rate": 4.566166016546335e-06, "loss": 1.049, "step": 7125 }, { "epoch": 0.21, "learning_rate": 4.566028683130595e-06, "loss": 1.2237, "step": 7126 }, { "epoch": 0.21, "learning_rate": 4.565891330047257e-06, "loss": 1.0841, "step": 7127 }, { "epoch": 0.21, "learning_rate": 4.565753957297628e-06, "loss": 1.1285, "step": 7128 }, { "epoch": 0.21, "learning_rate": 4.565616564883018e-06, "loss": 1.2174, "step": 7129 }, { "epoch": 0.21, "learning_rate": 4.565479152804732e-06, "loss": 1.1568, "step": 7130 }, { "epoch": 0.21, "learning_rate": 4.565341721064079e-06, "loss": 1.1951, "step": 7131 }, { "epoch": 0.21, "learning_rate": 4.565204269662368e-06, "loss": 1.101, "step": 7132 }, { "epoch": 0.21, "learning_rate": 4.565066798600907e-06, "loss": 1.2166, "step": 7133 }, { "epoch": 0.21, "learning_rate": 4.564929307881004e-06, "loss": 1.0893, "step": 7134 }, { "epoch": 0.21, "learning_rate": 4.564791797503969e-06, "loss": 1.1962, "step": 7135 }, { "epoch": 0.21, "learning_rate": 4.56465426747111e-06, "loss": 1.2383, "step": 7136 }, { "epoch": 0.22, "learning_rate": 4.564516717783738e-06, "loss": 1.1902, "step": 7137 }, { "epoch": 0.22, "learning_rate": 4.56437914844316e-06, "loss": 1.1916, "step": 7138 }, { "epoch": 0.22, "learning_rate": 4.5642415594506875e-06, "loss": 1.1262, "step": 7139 }, { "epoch": 0.22, "learning_rate": 4.564103950807628e-06, "loss": 0.9864, "step": 7140 }, { "epoch": 0.22, "learning_rate": 4.5639663225152945e-06, "loss": 1.1564, "step": 7141 }, { "epoch": 0.22, "learning_rate": 4.5638286745749955e-06, "loss": 1.1643, "step": 7142 }, { "epoch": 0.22, "learning_rate": 4.563691006988042e-06, "loss": 1.3605, "step": 7143 }, { "epoch": 0.22, "learning_rate": 4.563553319755743e-06, "loss": 1.2145, "step": 7144 }, { "epoch": 0.22, "learning_rate": 4.56341561287941e-06, "loss": 1.1264, "step": 7145 }, { "epoch": 0.22, "learning_rate": 4.5632778863603545e-06, "loss": 1.0044, "step": 7146 }, { "epoch": 0.22, "learning_rate": 4.563140140199888e-06, "loss": 1.153, "step": 7147 }, { "epoch": 0.22, "learning_rate": 4.56300237439932e-06, "loss": 1.1601, "step": 7148 }, { "epoch": 0.22, "learning_rate": 4.5628645889599635e-06, "loss": 1.1686, "step": 7149 }, { "epoch": 0.22, "learning_rate": 4.562726783883129e-06, "loss": 1.2634, "step": 7150 }, { "epoch": 0.22, "learning_rate": 4.56258895917013e-06, "loss": 1.1641, "step": 7151 }, { "epoch": 0.22, "learning_rate": 4.562451114822277e-06, "loss": 1.1035, "step": 7152 }, { "epoch": 0.22, "learning_rate": 4.5623132508408826e-06, "loss": 1.1152, "step": 7153 }, { "epoch": 0.22, "learning_rate": 4.562175367227259e-06, "loss": 1.2822, "step": 7154 }, { "epoch": 0.22, "learning_rate": 4.562037463982719e-06, "loss": 1.2496, "step": 7155 }, { "epoch": 0.22, "learning_rate": 4.561899541108576e-06, "loss": 1.2036, "step": 7156 }, { "epoch": 0.22, "learning_rate": 4.561761598606143e-06, "loss": 1.1077, "step": 7157 }, { "epoch": 0.22, "learning_rate": 4.561623636476732e-06, "loss": 1.2079, "step": 7158 }, { "epoch": 0.22, "learning_rate": 4.561485654721656e-06, "loss": 1.1909, "step": 7159 }, { "epoch": 0.22, "learning_rate": 4.561347653342231e-06, "loss": 1.1213, "step": 7160 }, { "epoch": 0.22, "learning_rate": 4.561209632339768e-06, "loss": 1.2359, "step": 7161 }, { "epoch": 0.22, "learning_rate": 4.561071591715582e-06, "loss": 1.184, "step": 7162 }, { "epoch": 0.22, "learning_rate": 4.560933531470987e-06, "loss": 1.2416, "step": 7163 }, { "epoch": 0.22, "learning_rate": 4.560795451607298e-06, "loss": 1.1219, "step": 7164 }, { "epoch": 0.22, "learning_rate": 4.560657352125828e-06, "loss": 1.23, "step": 7165 }, { "epoch": 0.22, "learning_rate": 4.560519233027893e-06, "loss": 1.1633, "step": 7166 }, { "epoch": 0.22, "learning_rate": 4.560381094314807e-06, "loss": 1.2129, "step": 7167 }, { "epoch": 0.22, "learning_rate": 4.5602429359878865e-06, "loss": 1.1394, "step": 7168 }, { "epoch": 0.22, "learning_rate": 4.560104758048444e-06, "loss": 1.2101, "step": 7169 }, { "epoch": 0.22, "learning_rate": 4.559966560497797e-06, "loss": 1.1985, "step": 7170 }, { "epoch": 0.22, "learning_rate": 4.5598283433372605e-06, "loss": 1.1494, "step": 7171 }, { "epoch": 0.22, "learning_rate": 4.559690106568151e-06, "loss": 1.1707, "step": 7172 }, { "epoch": 0.22, "learning_rate": 4.559551850191783e-06, "loss": 1.1063, "step": 7173 }, { "epoch": 0.22, "learning_rate": 4.559413574209472e-06, "loss": 1.2478, "step": 7174 }, { "epoch": 0.22, "learning_rate": 4.559275278622537e-06, "loss": 1.0784, "step": 7175 }, { "epoch": 0.22, "learning_rate": 4.559136963432292e-06, "loss": 1.1321, "step": 7176 }, { "epoch": 0.22, "learning_rate": 4.558998628640057e-06, "loss": 1.1165, "step": 7177 }, { "epoch": 0.22, "learning_rate": 4.558860274247145e-06, "loss": 1.107, "step": 7178 }, { "epoch": 0.22, "learning_rate": 4.558721900254875e-06, "loss": 1.051, "step": 7179 }, { "epoch": 0.22, "learning_rate": 4.558583506664564e-06, "loss": 1.205, "step": 7180 }, { "epoch": 0.22, "learning_rate": 4.5584450934775295e-06, "loss": 1.0922, "step": 7181 }, { "epoch": 0.22, "learning_rate": 4.55830666069509e-06, "loss": 1.2334, "step": 7182 }, { "epoch": 0.22, "learning_rate": 4.558168208318561e-06, "loss": 1.0901, "step": 7183 }, { "epoch": 0.22, "learning_rate": 4.558029736349263e-06, "loss": 1.0823, "step": 7184 }, { "epoch": 0.22, "learning_rate": 4.557891244788512e-06, "loss": 1.1379, "step": 7185 }, { "epoch": 0.22, "learning_rate": 4.557752733637628e-06, "loss": 1.26, "step": 7186 }, { "epoch": 0.22, "learning_rate": 4.55761420289793e-06, "loss": 1.1077, "step": 7187 }, { "epoch": 0.22, "learning_rate": 4.557475652570734e-06, "loss": 1.0761, "step": 7188 }, { "epoch": 0.22, "learning_rate": 4.557337082657361e-06, "loss": 1.1455, "step": 7189 }, { "epoch": 0.22, "learning_rate": 4.557198493159132e-06, "loss": 1.0837, "step": 7190 }, { "epoch": 0.22, "learning_rate": 4.557059884077362e-06, "loss": 1.2288, "step": 7191 }, { "epoch": 0.22, "learning_rate": 4.556921255413373e-06, "loss": 1.2021, "step": 7192 }, { "epoch": 0.22, "learning_rate": 4.5567826071684844e-06, "loss": 1.1152, "step": 7193 }, { "epoch": 0.22, "learning_rate": 4.556643939344016e-06, "loss": 1.2323, "step": 7194 }, { "epoch": 0.22, "learning_rate": 4.556505251941287e-06, "loss": 1.1535, "step": 7195 }, { "epoch": 0.22, "learning_rate": 4.55636654496162e-06, "loss": 1.1361, "step": 7196 }, { "epoch": 0.22, "learning_rate": 4.556227818406333e-06, "loss": 1.1457, "step": 7197 }, { "epoch": 0.22, "learning_rate": 4.556089072276748e-06, "loss": 1.1626, "step": 7198 }, { "epoch": 0.22, "learning_rate": 4.555950306574185e-06, "loss": 1.2203, "step": 7199 }, { "epoch": 0.22, "learning_rate": 4.555811521299965e-06, "loss": 1.2722, "step": 7200 }, { "epoch": 0.22, "learning_rate": 4.555672716455409e-06, "loss": 1.1461, "step": 7201 }, { "epoch": 0.22, "learning_rate": 4.55553389204184e-06, "loss": 1.0963, "step": 7202 }, { "epoch": 0.22, "learning_rate": 4.555395048060578e-06, "loss": 1.0645, "step": 7203 }, { "epoch": 0.22, "learning_rate": 4.555256184512944e-06, "loss": 1.1747, "step": 7204 }, { "epoch": 0.22, "learning_rate": 4.555117301400262e-06, "loss": 1.1062, "step": 7205 }, { "epoch": 0.22, "learning_rate": 4.5549783987238525e-06, "loss": 1.1953, "step": 7206 }, { "epoch": 0.22, "learning_rate": 4.554839476485039e-06, "loss": 1.1086, "step": 7207 }, { "epoch": 0.22, "learning_rate": 4.554700534685143e-06, "loss": 1.0746, "step": 7208 }, { "epoch": 0.22, "learning_rate": 4.5545615733254875e-06, "loss": 1.11, "step": 7209 }, { "epoch": 0.22, "learning_rate": 4.554422592407395e-06, "loss": 1.0872, "step": 7210 }, { "epoch": 0.22, "learning_rate": 4.5542835919321894e-06, "loss": 1.2233, "step": 7211 }, { "epoch": 0.22, "learning_rate": 4.554144571901193e-06, "loss": 1.2457, "step": 7212 }, { "epoch": 0.22, "learning_rate": 4.554005532315729e-06, "loss": 1.0643, "step": 7213 }, { "epoch": 0.22, "learning_rate": 4.5538664731771234e-06, "loss": 1.0759, "step": 7214 }, { "epoch": 0.22, "learning_rate": 4.553727394486697e-06, "loss": 1.2444, "step": 7215 }, { "epoch": 0.22, "learning_rate": 4.553588296245775e-06, "loss": 1.2189, "step": 7216 }, { "epoch": 0.22, "learning_rate": 4.5534491784556815e-06, "loss": 1.201, "step": 7217 }, { "epoch": 0.22, "learning_rate": 4.5533100411177405e-06, "loss": 1.0563, "step": 7218 }, { "epoch": 0.22, "learning_rate": 4.553170884233277e-06, "loss": 1.1754, "step": 7219 }, { "epoch": 0.22, "learning_rate": 4.553031707803616e-06, "loss": 1.1019, "step": 7220 }, { "epoch": 0.22, "learning_rate": 4.552892511830081e-06, "loss": 1.1072, "step": 7221 }, { "epoch": 0.22, "learning_rate": 4.552753296313998e-06, "loss": 1.1859, "step": 7222 }, { "epoch": 0.22, "learning_rate": 4.552614061256693e-06, "loss": 1.1624, "step": 7223 }, { "epoch": 0.22, "learning_rate": 4.55247480665949e-06, "loss": 1.1705, "step": 7224 }, { "epoch": 0.22, "learning_rate": 4.552335532523716e-06, "loss": 1.0805, "step": 7225 }, { "epoch": 0.22, "learning_rate": 4.552196238850696e-06, "loss": 1.1627, "step": 7226 }, { "epoch": 0.22, "learning_rate": 4.5520569256417566e-06, "loss": 1.2104, "step": 7227 }, { "epoch": 0.22, "learning_rate": 4.551917592898223e-06, "loss": 1.1777, "step": 7228 }, { "epoch": 0.22, "learning_rate": 4.551778240621422e-06, "loss": 1.1783, "step": 7229 }, { "epoch": 0.22, "learning_rate": 4.551638868812681e-06, "loss": 1.1509, "step": 7230 }, { "epoch": 0.22, "learning_rate": 4.5514994774733255e-06, "loss": 1.3157, "step": 7231 }, { "epoch": 0.22, "learning_rate": 4.551360066604683e-06, "loss": 1.1525, "step": 7232 }, { "epoch": 0.22, "learning_rate": 4.551220636208081e-06, "loss": 1.0916, "step": 7233 }, { "epoch": 0.22, "learning_rate": 4.551081186284847e-06, "loss": 1.1195, "step": 7234 }, { "epoch": 0.22, "learning_rate": 4.550941716836306e-06, "loss": 1.2406, "step": 7235 }, { "epoch": 0.22, "learning_rate": 4.550802227863788e-06, "loss": 1.2299, "step": 7236 }, { "epoch": 0.22, "learning_rate": 4.550662719368622e-06, "loss": 1.0419, "step": 7237 }, { "epoch": 0.22, "learning_rate": 4.550523191352134e-06, "loss": 1.0684, "step": 7238 }, { "epoch": 0.22, "learning_rate": 4.550383643815653e-06, "loss": 1.1151, "step": 7239 }, { "epoch": 0.22, "learning_rate": 4.550244076760507e-06, "loss": 1.0557, "step": 7240 }, { "epoch": 0.22, "learning_rate": 4.550104490188024e-06, "loss": 1.1562, "step": 7241 }, { "epoch": 0.22, "learning_rate": 4.5499648840995346e-06, "loss": 1.2594, "step": 7242 }, { "epoch": 0.22, "learning_rate": 4.549825258496366e-06, "loss": 1.1762, "step": 7243 }, { "epoch": 0.22, "learning_rate": 4.5496856133798494e-06, "loss": 1.2548, "step": 7244 }, { "epoch": 0.22, "learning_rate": 4.549545948751312e-06, "loss": 1.1442, "step": 7245 }, { "epoch": 0.22, "learning_rate": 4.5494062646120845e-06, "loss": 1.2076, "step": 7246 }, { "epoch": 0.22, "learning_rate": 4.549266560963497e-06, "loss": 1.0754, "step": 7247 }, { "epoch": 0.22, "learning_rate": 4.549126837806878e-06, "loss": 1.1815, "step": 7248 }, { "epoch": 0.22, "learning_rate": 4.548987095143558e-06, "loss": 1.1144, "step": 7249 }, { "epoch": 0.22, "learning_rate": 4.5488473329748686e-06, "loss": 1.1133, "step": 7250 }, { "epoch": 0.22, "learning_rate": 4.5487075513021385e-06, "loss": 1.0976, "step": 7251 }, { "epoch": 0.22, "learning_rate": 4.548567750126699e-06, "loss": 1.0555, "step": 7252 }, { "epoch": 0.22, "learning_rate": 4.548427929449882e-06, "loss": 1.0805, "step": 7253 }, { "epoch": 0.22, "learning_rate": 4.548288089273018e-06, "loss": 1.158, "step": 7254 }, { "epoch": 0.22, "learning_rate": 4.548148229597437e-06, "loss": 1.2196, "step": 7255 }, { "epoch": 0.22, "learning_rate": 4.548008350424472e-06, "loss": 1.2257, "step": 7256 }, { "epoch": 0.22, "learning_rate": 4.5478684517554536e-06, "loss": 1.0798, "step": 7257 }, { "epoch": 0.22, "learning_rate": 4.547728533591713e-06, "loss": 1.0659, "step": 7258 }, { "epoch": 0.22, "learning_rate": 4.5475885959345845e-06, "loss": 1.1605, "step": 7259 }, { "epoch": 0.22, "learning_rate": 4.547448638785398e-06, "loss": 1.1611, "step": 7260 }, { "epoch": 0.22, "learning_rate": 4.547308662145486e-06, "loss": 1.2012, "step": 7261 }, { "epoch": 0.22, "learning_rate": 4.547168666016182e-06, "loss": 1.3, "step": 7262 }, { "epoch": 0.22, "learning_rate": 4.547028650398818e-06, "loss": 1.1627, "step": 7263 }, { "epoch": 0.22, "learning_rate": 4.546888615294728e-06, "loss": 1.1221, "step": 7264 }, { "epoch": 0.22, "learning_rate": 4.546748560705243e-06, "loss": 1.0696, "step": 7265 }, { "epoch": 0.22, "learning_rate": 4.546608486631698e-06, "loss": 1.0871, "step": 7266 }, { "epoch": 0.22, "learning_rate": 4.546468393075426e-06, "loss": 1.1196, "step": 7267 }, { "epoch": 0.22, "learning_rate": 4.546328280037761e-06, "loss": 1.1524, "step": 7268 }, { "epoch": 0.22, "learning_rate": 4.546188147520035e-06, "loss": 1.166, "step": 7269 }, { "epoch": 0.22, "learning_rate": 4.546047995523584e-06, "loss": 1.0015, "step": 7270 }, { "epoch": 0.22, "learning_rate": 4.5459078240497416e-06, "loss": 1.1092, "step": 7271 }, { "epoch": 0.22, "learning_rate": 4.545767633099843e-06, "loss": 1.1268, "step": 7272 }, { "epoch": 0.22, "learning_rate": 4.54562742267522e-06, "loss": 1.1426, "step": 7273 }, { "epoch": 0.22, "learning_rate": 4.54548719277721e-06, "loss": 1.2057, "step": 7274 }, { "epoch": 0.22, "learning_rate": 4.545346943407148e-06, "loss": 1.1622, "step": 7275 }, { "epoch": 0.22, "learning_rate": 4.545206674566366e-06, "loss": 1.1655, "step": 7276 }, { "epoch": 0.22, "learning_rate": 4.545066386256203e-06, "loss": 1.1622, "step": 7277 }, { "epoch": 0.22, "learning_rate": 4.544926078477993e-06, "loss": 1.1016, "step": 7278 }, { "epoch": 0.22, "learning_rate": 4.544785751233071e-06, "loss": 1.276, "step": 7279 }, { "epoch": 0.22, "learning_rate": 4.544645404522773e-06, "loss": 1.2865, "step": 7280 }, { "epoch": 0.22, "learning_rate": 4.5445050383484365e-06, "loss": 1.2736, "step": 7281 }, { "epoch": 0.22, "learning_rate": 4.544364652711396e-06, "loss": 1.1566, "step": 7282 }, { "epoch": 0.22, "learning_rate": 4.544224247612989e-06, "loss": 1.1534, "step": 7283 }, { "epoch": 0.22, "learning_rate": 4.544083823054552e-06, "loss": 1.2037, "step": 7284 }, { "epoch": 0.22, "learning_rate": 4.543943379037421e-06, "loss": 1.1824, "step": 7285 }, { "epoch": 0.22, "learning_rate": 4.543802915562934e-06, "loss": 1.1625, "step": 7286 }, { "epoch": 0.22, "learning_rate": 4.5436624326324265e-06, "loss": 1.2208, "step": 7287 }, { "epoch": 0.22, "learning_rate": 4.543521930247237e-06, "loss": 1.0106, "step": 7288 }, { "epoch": 0.22, "learning_rate": 4.543381408408704e-06, "loss": 1.1486, "step": 7289 }, { "epoch": 0.22, "learning_rate": 4.543240867118164e-06, "loss": 1.0827, "step": 7290 }, { "epoch": 0.22, "learning_rate": 4.543100306376954e-06, "loss": 1.1819, "step": 7291 }, { "epoch": 0.22, "learning_rate": 4.5429597261864135e-06, "loss": 1.2017, "step": 7292 }, { "epoch": 0.22, "learning_rate": 4.5428191265478805e-06, "loss": 1.3162, "step": 7293 }, { "epoch": 0.22, "learning_rate": 4.542678507462693e-06, "loss": 1.1752, "step": 7294 }, { "epoch": 0.22, "learning_rate": 4.542537868932191e-06, "loss": 1.186, "step": 7295 }, { "epoch": 0.22, "learning_rate": 4.542397210957711e-06, "loss": 1.1982, "step": 7296 }, { "epoch": 0.22, "learning_rate": 4.542256533540594e-06, "loss": 1.0609, "step": 7297 }, { "epoch": 0.22, "learning_rate": 4.542115836682177e-06, "loss": 1.2584, "step": 7298 }, { "epoch": 0.22, "learning_rate": 4.541975120383803e-06, "loss": 1.3094, "step": 7299 }, { "epoch": 0.22, "learning_rate": 4.5418343846468076e-06, "loss": 1.146, "step": 7300 }, { "epoch": 0.22, "learning_rate": 4.541693629472532e-06, "loss": 1.0342, "step": 7301 }, { "epoch": 0.22, "learning_rate": 4.541552854862317e-06, "loss": 1.0256, "step": 7302 }, { "epoch": 0.22, "learning_rate": 4.541412060817502e-06, "loss": 1.175, "step": 7303 }, { "epoch": 0.22, "learning_rate": 4.541271247339428e-06, "loss": 1.1192, "step": 7304 }, { "epoch": 0.22, "learning_rate": 4.541130414429434e-06, "loss": 1.1479, "step": 7305 }, { "epoch": 0.22, "learning_rate": 4.540989562088861e-06, "loss": 1.2076, "step": 7306 }, { "epoch": 0.22, "learning_rate": 4.540848690319052e-06, "loss": 1.0611, "step": 7307 }, { "epoch": 0.22, "learning_rate": 4.5407077991213455e-06, "loss": 1.0609, "step": 7308 }, { "epoch": 0.22, "learning_rate": 4.540566888497083e-06, "loss": 1.1371, "step": 7309 }, { "epoch": 0.22, "learning_rate": 4.540425958447607e-06, "loss": 1.1115, "step": 7310 }, { "epoch": 0.22, "learning_rate": 4.540285008974259e-06, "loss": 1.1973, "step": 7311 }, { "epoch": 0.22, "learning_rate": 4.54014404007838e-06, "loss": 1.1588, "step": 7312 }, { "epoch": 0.22, "learning_rate": 4.540003051761312e-06, "loss": 1.2568, "step": 7313 }, { "epoch": 0.22, "learning_rate": 4.539862044024398e-06, "loss": 1.1546, "step": 7314 }, { "epoch": 0.22, "learning_rate": 4.5397210168689795e-06, "loss": 1.1782, "step": 7315 }, { "epoch": 0.22, "learning_rate": 4.539579970296399e-06, "loss": 1.1844, "step": 7316 }, { "epoch": 0.22, "learning_rate": 4.5394389043080004e-06, "loss": 1.22, "step": 7317 }, { "epoch": 0.22, "learning_rate": 4.539297818905124e-06, "loss": 1.2021, "step": 7318 }, { "epoch": 0.22, "learning_rate": 4.5391567140891155e-06, "loss": 1.1196, "step": 7319 }, { "epoch": 0.22, "learning_rate": 4.539015589861318e-06, "loss": 1.1156, "step": 7320 }, { "epoch": 0.22, "learning_rate": 4.538874446223073e-06, "loss": 1.1896, "step": 7321 }, { "epoch": 0.22, "learning_rate": 4.5387332831757254e-06, "loss": 1.1238, "step": 7322 }, { "epoch": 0.22, "learning_rate": 4.538592100720619e-06, "loss": 1.1065, "step": 7323 }, { "epoch": 0.22, "learning_rate": 4.5384508988590975e-06, "loss": 1.1287, "step": 7324 }, { "epoch": 0.22, "learning_rate": 4.538309677592505e-06, "loss": 1.1084, "step": 7325 }, { "epoch": 0.22, "learning_rate": 4.538168436922187e-06, "loss": 0.9809, "step": 7326 }, { "epoch": 0.22, "learning_rate": 4.538027176849487e-06, "loss": 1.108, "step": 7327 }, { "epoch": 0.22, "learning_rate": 4.537885897375749e-06, "loss": 1.1664, "step": 7328 }, { "epoch": 0.22, "learning_rate": 4.5377445985023185e-06, "loss": 1.1522, "step": 7329 }, { "epoch": 0.22, "learning_rate": 4.537603280230542e-06, "loss": 1.272, "step": 7330 }, { "epoch": 0.22, "learning_rate": 4.537461942561762e-06, "loss": 1.12, "step": 7331 }, { "epoch": 0.22, "learning_rate": 4.537320585497327e-06, "loss": 1.0946, "step": 7332 }, { "epoch": 0.22, "learning_rate": 4.5371792090385805e-06, "loss": 1.1329, "step": 7333 }, { "epoch": 0.22, "learning_rate": 4.53703781318687e-06, "loss": 1.1012, "step": 7334 }, { "epoch": 0.22, "learning_rate": 4.53689639794354e-06, "loss": 1.1056, "step": 7335 }, { "epoch": 0.22, "learning_rate": 4.536754963309937e-06, "loss": 1.0726, "step": 7336 }, { "epoch": 0.22, "learning_rate": 4.536613509287407e-06, "loss": 1.2129, "step": 7337 }, { "epoch": 0.22, "learning_rate": 4.536472035877298e-06, "loss": 1.1987, "step": 7338 }, { "epoch": 0.22, "learning_rate": 4.5363305430809565e-06, "loss": 1.1017, "step": 7339 }, { "epoch": 0.22, "learning_rate": 4.5361890308997295e-06, "loss": 1.182, "step": 7340 }, { "epoch": 0.22, "learning_rate": 4.5360474993349625e-06, "loss": 1.1692, "step": 7341 }, { "epoch": 0.22, "learning_rate": 4.535905948388004e-06, "loss": 1.0915, "step": 7342 }, { "epoch": 0.22, "learning_rate": 4.535764378060201e-06, "loss": 1.2443, "step": 7343 }, { "epoch": 0.22, "learning_rate": 4.535622788352902e-06, "loss": 1.0411, "step": 7344 }, { "epoch": 0.22, "learning_rate": 4.5354811792674545e-06, "loss": 1.1406, "step": 7345 }, { "epoch": 0.22, "learning_rate": 4.535339550805207e-06, "loss": 1.1108, "step": 7346 }, { "epoch": 0.22, "learning_rate": 4.535197902967506e-06, "loss": 1.0869, "step": 7347 }, { "epoch": 0.22, "learning_rate": 4.535056235755703e-06, "loss": 1.0566, "step": 7348 }, { "epoch": 0.22, "learning_rate": 4.5349145491711436e-06, "loss": 1.1481, "step": 7349 }, { "epoch": 0.22, "learning_rate": 4.534772843215178e-06, "loss": 1.1918, "step": 7350 }, { "epoch": 0.22, "learning_rate": 4.534631117889154e-06, "loss": 1.1287, "step": 7351 }, { "epoch": 0.22, "learning_rate": 4.534489373194423e-06, "loss": 1.0646, "step": 7352 }, { "epoch": 0.22, "learning_rate": 4.534347609132332e-06, "loss": 1.1409, "step": 7353 }, { "epoch": 0.22, "learning_rate": 4.534205825704232e-06, "loss": 1.1708, "step": 7354 }, { "epoch": 0.22, "learning_rate": 4.5340640229114715e-06, "loss": 1.2567, "step": 7355 }, { "epoch": 0.22, "learning_rate": 4.533922200755403e-06, "loss": 1.1818, "step": 7356 }, { "epoch": 0.22, "learning_rate": 4.533780359237373e-06, "loss": 1.0815, "step": 7357 }, { "epoch": 0.22, "learning_rate": 4.533638498358734e-06, "loss": 1.147, "step": 7358 }, { "epoch": 0.22, "learning_rate": 4.533496618120836e-06, "loss": 1.1263, "step": 7359 }, { "epoch": 0.22, "learning_rate": 4.533354718525029e-06, "loss": 1.1705, "step": 7360 }, { "epoch": 0.22, "learning_rate": 4.533212799572666e-06, "loss": 1.2018, "step": 7361 }, { "epoch": 0.22, "learning_rate": 4.533070861265095e-06, "loss": 1.1476, "step": 7362 }, { "epoch": 0.22, "learning_rate": 4.532928903603668e-06, "loss": 1.1458, "step": 7363 }, { "epoch": 0.22, "learning_rate": 4.5327869265897385e-06, "loss": 1.2256, "step": 7364 }, { "epoch": 0.22, "learning_rate": 4.532644930224656e-06, "loss": 1.105, "step": 7365 }, { "epoch": 0.22, "learning_rate": 4.532502914509772e-06, "loss": 1.053, "step": 7366 }, { "epoch": 0.22, "learning_rate": 4.53236087944644e-06, "loss": 1.2971, "step": 7367 }, { "epoch": 0.22, "learning_rate": 4.53221882503601e-06, "loss": 1.3905, "step": 7368 }, { "epoch": 0.22, "learning_rate": 4.532076751279837e-06, "loss": 1.1563, "step": 7369 }, { "epoch": 0.22, "learning_rate": 4.531934658179271e-06, "loss": 1.1879, "step": 7370 }, { "epoch": 0.22, "learning_rate": 4.531792545735667e-06, "loss": 1.0984, "step": 7371 }, { "epoch": 0.22, "learning_rate": 4.531650413950375e-06, "loss": 1.1737, "step": 7372 }, { "epoch": 0.22, "learning_rate": 4.5315082628247495e-06, "loss": 1.2487, "step": 7373 }, { "epoch": 0.22, "learning_rate": 4.531366092360145e-06, "loss": 1.1202, "step": 7374 }, { "epoch": 0.22, "learning_rate": 4.531223902557913e-06, "loss": 1.136, "step": 7375 }, { "epoch": 0.22, "learning_rate": 4.531081693419408e-06, "loss": 1.1937, "step": 7376 }, { "epoch": 0.22, "learning_rate": 4.530939464945983e-06, "loss": 1.0874, "step": 7377 }, { "epoch": 0.22, "learning_rate": 4.5307972171389925e-06, "loss": 1.1557, "step": 7378 }, { "epoch": 0.22, "learning_rate": 4.530654949999791e-06, "loss": 1.0769, "step": 7379 }, { "epoch": 0.22, "learning_rate": 4.530512663529732e-06, "loss": 1.1334, "step": 7380 }, { "epoch": 0.22, "learning_rate": 4.53037035773017e-06, "loss": 1.1017, "step": 7381 }, { "epoch": 0.22, "learning_rate": 4.530228032602461e-06, "loss": 1.2406, "step": 7382 }, { "epoch": 0.22, "learning_rate": 4.530085688147958e-06, "loss": 1.1112, "step": 7383 }, { "epoch": 0.22, "learning_rate": 4.529943324368018e-06, "loss": 1.0766, "step": 7384 }, { "epoch": 0.22, "learning_rate": 4.529800941263994e-06, "loss": 1.1319, "step": 7385 }, { "epoch": 0.22, "learning_rate": 4.529658538837243e-06, "loss": 1.0692, "step": 7386 }, { "epoch": 0.22, "learning_rate": 4.529516117089121e-06, "loss": 1.2361, "step": 7387 }, { "epoch": 0.22, "learning_rate": 4.529373676020982e-06, "loss": 1.1062, "step": 7388 }, { "epoch": 0.22, "learning_rate": 4.529231215634183e-06, "loss": 1.2086, "step": 7389 }, { "epoch": 0.22, "learning_rate": 4.529088735930081e-06, "loss": 1.0651, "step": 7390 }, { "epoch": 0.22, "learning_rate": 4.528946236910031e-06, "loss": 1.1638, "step": 7391 }, { "epoch": 0.22, "learning_rate": 4.52880371857539e-06, "loss": 1.2653, "step": 7392 }, { "epoch": 0.22, "learning_rate": 4.528661180927515e-06, "loss": 0.9892, "step": 7393 }, { "epoch": 0.22, "learning_rate": 4.5285186239677625e-06, "loss": 1.0499, "step": 7394 }, { "epoch": 0.22, "learning_rate": 4.528376047697489e-06, "loss": 1.1569, "step": 7395 }, { "epoch": 0.22, "learning_rate": 4.5282334521180534e-06, "loss": 1.099, "step": 7396 }, { "epoch": 0.22, "learning_rate": 4.528090837230812e-06, "loss": 1.1897, "step": 7397 }, { "epoch": 0.22, "learning_rate": 4.527948203037122e-06, "loss": 1.1088, "step": 7398 }, { "epoch": 0.22, "learning_rate": 4.527805549538343e-06, "loss": 1.1896, "step": 7399 }, { "epoch": 0.22, "learning_rate": 4.52766287673583e-06, "loss": 1.2898, "step": 7400 }, { "epoch": 0.22, "learning_rate": 4.527520184630944e-06, "loss": 1.111, "step": 7401 }, { "epoch": 0.22, "learning_rate": 4.527377473225042e-06, "loss": 0.9574, "step": 7402 }, { "epoch": 0.22, "learning_rate": 4.527234742519483e-06, "loss": 1.2298, "step": 7403 }, { "epoch": 0.22, "learning_rate": 4.527091992515625e-06, "loss": 1.2787, "step": 7404 }, { "epoch": 0.22, "learning_rate": 4.526949223214829e-06, "loss": 1.1545, "step": 7405 }, { "epoch": 0.22, "learning_rate": 4.526806434618452e-06, "loss": 1.2998, "step": 7406 }, { "epoch": 0.22, "learning_rate": 4.526663626727853e-06, "loss": 1.127, "step": 7407 }, { "epoch": 0.22, "learning_rate": 4.5265207995443935e-06, "loss": 1.0761, "step": 7408 }, { "epoch": 0.22, "learning_rate": 4.526377953069432e-06, "loss": 1.1735, "step": 7409 }, { "epoch": 0.22, "learning_rate": 4.526235087304327e-06, "loss": 1.068, "step": 7410 }, { "epoch": 0.22, "learning_rate": 4.526092202250441e-06, "loss": 1.0234, "step": 7411 }, { "epoch": 0.22, "learning_rate": 4.525949297909132e-06, "loss": 1.2395, "step": 7412 }, { "epoch": 0.22, "learning_rate": 4.5258063742817625e-06, "loss": 1.07, "step": 7413 }, { "epoch": 0.22, "learning_rate": 4.5256634313696915e-06, "loss": 1.147, "step": 7414 }, { "epoch": 0.22, "learning_rate": 4.52552046917428e-06, "loss": 1.1031, "step": 7415 }, { "epoch": 0.22, "learning_rate": 4.5253774876968905e-06, "loss": 1.132, "step": 7416 }, { "epoch": 0.22, "learning_rate": 4.525234486938881e-06, "loss": 1.2599, "step": 7417 }, { "epoch": 0.22, "learning_rate": 4.525091466901615e-06, "loss": 1.2117, "step": 7418 }, { "epoch": 0.22, "learning_rate": 4.524948427586454e-06, "loss": 1.0938, "step": 7419 }, { "epoch": 0.22, "learning_rate": 4.52480536899476e-06, "loss": 1.1113, "step": 7420 }, { "epoch": 0.22, "learning_rate": 4.524662291127892e-06, "loss": 1.098, "step": 7421 }, { "epoch": 0.22, "learning_rate": 4.524519193987215e-06, "loss": 1.0061, "step": 7422 }, { "epoch": 0.22, "learning_rate": 4.524376077574092e-06, "loss": 1.1456, "step": 7423 }, { "epoch": 0.22, "learning_rate": 4.5242329418898816e-06, "loss": 1.1642, "step": 7424 }, { "epoch": 0.22, "learning_rate": 4.52408978693595e-06, "loss": 1.2206, "step": 7425 }, { "epoch": 0.22, "learning_rate": 4.5239466127136576e-06, "loss": 1.0943, "step": 7426 }, { "epoch": 0.22, "learning_rate": 4.523803419224368e-06, "loss": 1.2423, "step": 7427 }, { "epoch": 0.22, "learning_rate": 4.5236602064694446e-06, "loss": 1.1542, "step": 7428 }, { "epoch": 0.22, "learning_rate": 4.5235169744502505e-06, "loss": 1.225, "step": 7429 }, { "epoch": 0.22, "learning_rate": 4.52337372316815e-06, "loss": 1.2388, "step": 7430 }, { "epoch": 0.22, "learning_rate": 4.5232304526245065e-06, "loss": 1.041, "step": 7431 }, { "epoch": 0.22, "learning_rate": 4.523087162820682e-06, "loss": 1.0942, "step": 7432 }, { "epoch": 0.22, "learning_rate": 4.522943853758044e-06, "loss": 1.1461, "step": 7433 }, { "epoch": 0.22, "learning_rate": 4.522800525437953e-06, "loss": 1.1868, "step": 7434 }, { "epoch": 0.22, "learning_rate": 4.5226571778617755e-06, "loss": 1.2327, "step": 7435 }, { "epoch": 0.22, "learning_rate": 4.522513811030877e-06, "loss": 1.1857, "step": 7436 }, { "epoch": 0.22, "learning_rate": 4.522370424946621e-06, "loss": 1.1082, "step": 7437 }, { "epoch": 0.22, "learning_rate": 4.5222270196103715e-06, "loss": 1.0386, "step": 7438 }, { "epoch": 0.22, "learning_rate": 4.522083595023495e-06, "loss": 1.1154, "step": 7439 }, { "epoch": 0.22, "learning_rate": 4.521940151187356e-06, "loss": 1.0502, "step": 7440 }, { "epoch": 0.22, "learning_rate": 4.521796688103321e-06, "loss": 1.2194, "step": 7441 }, { "epoch": 0.22, "learning_rate": 4.5216532057727564e-06, "loss": 1.0879, "step": 7442 }, { "epoch": 0.22, "learning_rate": 4.521509704197026e-06, "loss": 1.0914, "step": 7443 }, { "epoch": 0.22, "learning_rate": 4.521366183377497e-06, "loss": 1.1417, "step": 7444 }, { "epoch": 0.22, "learning_rate": 4.521222643315535e-06, "loss": 1.1689, "step": 7445 }, { "epoch": 0.22, "learning_rate": 4.521079084012507e-06, "loss": 1.1313, "step": 7446 }, { "epoch": 0.22, "learning_rate": 4.52093550546978e-06, "loss": 1.0848, "step": 7447 }, { "epoch": 0.22, "learning_rate": 4.5207919076887195e-06, "loss": 1.1973, "step": 7448 }, { "epoch": 0.22, "learning_rate": 4.520648290670694e-06, "loss": 1.3463, "step": 7449 }, { "epoch": 0.22, "learning_rate": 4.52050465441707e-06, "loss": 1.0508, "step": 7450 }, { "epoch": 0.22, "learning_rate": 4.520360998929215e-06, "loss": 1.0932, "step": 7451 }, { "epoch": 0.22, "learning_rate": 4.5202173242084956e-06, "loss": 1.1338, "step": 7452 }, { "epoch": 0.22, "learning_rate": 4.520073630256281e-06, "loss": 1.0635, "step": 7453 }, { "epoch": 0.22, "learning_rate": 4.519929917073937e-06, "loss": 1.1199, "step": 7454 }, { "epoch": 0.22, "learning_rate": 4.519786184662834e-06, "loss": 1.2295, "step": 7455 }, { "epoch": 0.22, "learning_rate": 4.5196424330243395e-06, "loss": 1.0961, "step": 7456 }, { "epoch": 0.22, "learning_rate": 4.519498662159822e-06, "loss": 1.1172, "step": 7457 }, { "epoch": 0.22, "learning_rate": 4.5193548720706486e-06, "loss": 1.1494, "step": 7458 }, { "epoch": 0.22, "learning_rate": 4.51921106275819e-06, "loss": 1.0649, "step": 7459 }, { "epoch": 0.22, "learning_rate": 4.519067234223815e-06, "loss": 1.1188, "step": 7460 }, { "epoch": 0.22, "learning_rate": 4.518923386468891e-06, "loss": 1.1302, "step": 7461 }, { "epoch": 0.22, "learning_rate": 4.518779519494791e-06, "loss": 1.1596, "step": 7462 }, { "epoch": 0.22, "learning_rate": 4.5186356333028806e-06, "loss": 1.1259, "step": 7463 }, { "epoch": 0.22, "learning_rate": 4.5184917278945305e-06, "loss": 1.151, "step": 7464 }, { "epoch": 0.22, "learning_rate": 4.518347803271113e-06, "loss": 1.0501, "step": 7465 }, { "epoch": 0.22, "learning_rate": 4.518203859433996e-06, "loss": 1.1553, "step": 7466 }, { "epoch": 0.22, "learning_rate": 4.51805989638455e-06, "loss": 1.1721, "step": 7467 }, { "epoch": 0.22, "learning_rate": 4.517915914124145e-06, "loss": 1.1813, "step": 7468 }, { "epoch": 0.23, "learning_rate": 4.517771912654153e-06, "loss": 1.1461, "step": 7469 }, { "epoch": 0.23, "learning_rate": 4.517627891975945e-06, "loss": 1.1256, "step": 7470 }, { "epoch": 0.23, "learning_rate": 4.517483852090891e-06, "loss": 1.1556, "step": 7471 }, { "epoch": 0.23, "learning_rate": 4.517339793000361e-06, "loss": 1.131, "step": 7472 }, { "epoch": 0.23, "learning_rate": 4.517195714705728e-06, "loss": 1.2159, "step": 7473 }, { "epoch": 0.23, "learning_rate": 4.517051617208365e-06, "loss": 1.2264, "step": 7474 }, { "epoch": 0.23, "learning_rate": 4.516907500509641e-06, "loss": 1.3211, "step": 7475 }, { "epoch": 0.23, "learning_rate": 4.516763364610929e-06, "loss": 1.1399, "step": 7476 }, { "epoch": 0.23, "learning_rate": 4.5166192095136e-06, "loss": 1.1653, "step": 7477 }, { "epoch": 0.23, "learning_rate": 4.516475035219029e-06, "loss": 1.0685, "step": 7478 }, { "epoch": 0.23, "learning_rate": 4.516330841728585e-06, "loss": 1.1016, "step": 7479 }, { "epoch": 0.23, "learning_rate": 4.516186629043645e-06, "loss": 1.1709, "step": 7480 }, { "epoch": 0.23, "learning_rate": 4.516042397165577e-06, "loss": 1.2007, "step": 7481 }, { "epoch": 0.23, "learning_rate": 4.515898146095758e-06, "loss": 1.2156, "step": 7482 }, { "epoch": 0.23, "learning_rate": 4.515753875835559e-06, "loss": 1.1807, "step": 7483 }, { "epoch": 0.23, "learning_rate": 4.515609586386354e-06, "loss": 1.1263, "step": 7484 }, { "epoch": 0.23, "learning_rate": 4.515465277749516e-06, "loss": 1.1174, "step": 7485 }, { "epoch": 0.23, "learning_rate": 4.51532094992642e-06, "loss": 1.2465, "step": 7486 }, { "epoch": 0.23, "learning_rate": 4.515176602918439e-06, "loss": 1.0689, "step": 7487 }, { "epoch": 0.23, "learning_rate": 4.515032236726946e-06, "loss": 1.1005, "step": 7488 }, { "epoch": 0.23, "learning_rate": 4.514887851353318e-06, "loss": 1.1141, "step": 7489 }, { "epoch": 0.23, "learning_rate": 4.514743446798927e-06, "loss": 1.1354, "step": 7490 }, { "epoch": 0.23, "learning_rate": 4.51459902306515e-06, "loss": 1.0775, "step": 7491 }, { "epoch": 0.23, "learning_rate": 4.51445458015336e-06, "loss": 1.0758, "step": 7492 }, { "epoch": 0.23, "learning_rate": 4.5143101180649325e-06, "loss": 1.1146, "step": 7493 }, { "epoch": 0.23, "learning_rate": 4.5141656368012425e-06, "loss": 1.1943, "step": 7494 }, { "epoch": 0.23, "learning_rate": 4.514021136363667e-06, "loss": 1.1109, "step": 7495 }, { "epoch": 0.23, "learning_rate": 4.513876616753579e-06, "loss": 1.1692, "step": 7496 }, { "epoch": 0.23, "learning_rate": 4.513732077972355e-06, "loss": 1.1118, "step": 7497 }, { "epoch": 0.23, "learning_rate": 4.513587520021372e-06, "loss": 1.0252, "step": 7498 }, { "epoch": 0.23, "learning_rate": 4.513442942902006e-06, "loss": 1.3154, "step": 7499 }, { "epoch": 0.23, "learning_rate": 4.513298346615633e-06, "loss": 1.0869, "step": 7500 }, { "epoch": 0.23, "learning_rate": 4.513153731163628e-06, "loss": 1.1031, "step": 7501 }, { "epoch": 0.23, "learning_rate": 4.513009096547372e-06, "loss": 1.072, "step": 7502 }, { "epoch": 0.23, "learning_rate": 4.512864442768236e-06, "loss": 1.1451, "step": 7503 }, { "epoch": 0.23, "learning_rate": 4.512719769827601e-06, "loss": 1.1941, "step": 7504 }, { "epoch": 0.23, "learning_rate": 4.512575077726843e-06, "loss": 1.2285, "step": 7505 }, { "epoch": 0.23, "learning_rate": 4.51243036646734e-06, "loss": 1.0479, "step": 7506 }, { "epoch": 0.23, "learning_rate": 4.512285636050469e-06, "loss": 1.1229, "step": 7507 }, { "epoch": 0.23, "learning_rate": 4.512140886477608e-06, "loss": 1.1266, "step": 7508 }, { "epoch": 0.23, "learning_rate": 4.5119961177501344e-06, "loss": 1.0493, "step": 7509 }, { "epoch": 0.23, "learning_rate": 4.511851329869427e-06, "loss": 1.1524, "step": 7510 }, { "epoch": 0.23, "learning_rate": 4.5117065228368636e-06, "loss": 1.2069, "step": 7511 }, { "epoch": 0.23, "learning_rate": 4.511561696653823e-06, "loss": 1.1716, "step": 7512 }, { "epoch": 0.23, "learning_rate": 4.511416851321684e-06, "loss": 1.0744, "step": 7513 }, { "epoch": 0.23, "learning_rate": 4.5112719868418255e-06, "loss": 1.1403, "step": 7514 }, { "epoch": 0.23, "learning_rate": 4.511127103215626e-06, "loss": 1.1344, "step": 7515 }, { "epoch": 0.23, "learning_rate": 4.510982200444466e-06, "loss": 1.0173, "step": 7516 }, { "epoch": 0.23, "learning_rate": 4.5108372785297225e-06, "loss": 1.2362, "step": 7517 }, { "epoch": 0.23, "learning_rate": 4.510692337472778e-06, "loss": 1.2161, "step": 7518 }, { "epoch": 0.23, "learning_rate": 4.51054737727501e-06, "loss": 1.077, "step": 7519 }, { "epoch": 0.23, "learning_rate": 4.510402397937799e-06, "loss": 1.2349, "step": 7520 }, { "epoch": 0.23, "learning_rate": 4.510257399462526e-06, "loss": 1.1344, "step": 7521 }, { "epoch": 0.23, "learning_rate": 4.51011238185057e-06, "loss": 1.1289, "step": 7522 }, { "epoch": 0.23, "learning_rate": 4.509967345103313e-06, "loss": 1.127, "step": 7523 }, { "epoch": 0.23, "learning_rate": 4.509822289222135e-06, "loss": 1.1956, "step": 7524 }, { "epoch": 0.23, "learning_rate": 4.509677214208417e-06, "loss": 1.1406, "step": 7525 }, { "epoch": 0.23, "learning_rate": 4.509532120063539e-06, "loss": 1.1014, "step": 7526 }, { "epoch": 0.23, "learning_rate": 4.5093870067888825e-06, "loss": 1.1449, "step": 7527 }, { "epoch": 0.23, "learning_rate": 4.50924187438583e-06, "loss": 0.9839, "step": 7528 }, { "epoch": 0.23, "learning_rate": 4.509096722855764e-06, "loss": 1.0293, "step": 7529 }, { "epoch": 0.23, "learning_rate": 4.508951552200062e-06, "loss": 1.2289, "step": 7530 }, { "epoch": 0.23, "learning_rate": 4.508806362420111e-06, "loss": 1.1104, "step": 7531 }, { "epoch": 0.23, "learning_rate": 4.508661153517291e-06, "loss": 1.0994, "step": 7532 }, { "epoch": 0.23, "learning_rate": 4.5085159254929835e-06, "loss": 1.2477, "step": 7533 }, { "epoch": 0.23, "learning_rate": 4.5083706783485715e-06, "loss": 1.1208, "step": 7534 }, { "epoch": 0.23, "learning_rate": 4.508225412085438e-06, "loss": 1.1889, "step": 7535 }, { "epoch": 0.23, "learning_rate": 4.508080126704965e-06, "loss": 1.259, "step": 7536 }, { "epoch": 0.23, "learning_rate": 4.507934822208539e-06, "loss": 1.1096, "step": 7537 }, { "epoch": 0.23, "learning_rate": 4.507789498597538e-06, "loss": 1.1837, "step": 7538 }, { "epoch": 0.23, "learning_rate": 4.507644155873349e-06, "loss": 1.1307, "step": 7539 }, { "epoch": 0.23, "learning_rate": 4.507498794037353e-06, "loss": 1.0648, "step": 7540 }, { "epoch": 0.23, "learning_rate": 4.507353413090937e-06, "loss": 1.1338, "step": 7541 }, { "epoch": 0.23, "learning_rate": 4.507208013035483e-06, "loss": 1.0932, "step": 7542 }, { "epoch": 0.23, "learning_rate": 4.507062593872376e-06, "loss": 1.135, "step": 7543 }, { "epoch": 0.23, "learning_rate": 4.506917155602999e-06, "loss": 1.226, "step": 7544 }, { "epoch": 0.23, "learning_rate": 4.506771698228737e-06, "loss": 1.2314, "step": 7545 }, { "epoch": 0.23, "learning_rate": 4.506626221750975e-06, "loss": 1.0586, "step": 7546 }, { "epoch": 0.23, "learning_rate": 4.506480726171099e-06, "loss": 1.1614, "step": 7547 }, { "epoch": 0.23, "learning_rate": 4.506335211490491e-06, "loss": 1.2179, "step": 7548 }, { "epoch": 0.23, "learning_rate": 4.506189677710539e-06, "loss": 1.2875, "step": 7549 }, { "epoch": 0.23, "learning_rate": 4.506044124832627e-06, "loss": 1.2845, "step": 7550 }, { "epoch": 0.23, "learning_rate": 4.505898552858142e-06, "loss": 1.1656, "step": 7551 }, { "epoch": 0.23, "learning_rate": 4.505752961788468e-06, "loss": 1.0878, "step": 7552 }, { "epoch": 0.23, "learning_rate": 4.505607351624992e-06, "loss": 1.2305, "step": 7553 }, { "epoch": 0.23, "learning_rate": 4.505461722369101e-06, "loss": 1.1385, "step": 7554 }, { "epoch": 0.23, "learning_rate": 4.505316074022179e-06, "loss": 1.1249, "step": 7555 }, { "epoch": 0.23, "learning_rate": 4.505170406585614e-06, "loss": 1.2129, "step": 7556 }, { "epoch": 0.23, "learning_rate": 4.505024720060792e-06, "loss": 1.1407, "step": 7557 }, { "epoch": 0.23, "learning_rate": 4.504879014449102e-06, "loss": 1.1073, "step": 7558 }, { "epoch": 0.23, "learning_rate": 4.504733289751928e-06, "loss": 1.0892, "step": 7559 }, { "epoch": 0.23, "learning_rate": 4.504587545970658e-06, "loss": 1.074, "step": 7560 }, { "epoch": 0.23, "learning_rate": 4.504441783106681e-06, "loss": 1.1899, "step": 7561 }, { "epoch": 0.23, "learning_rate": 4.504296001161384e-06, "loss": 1.2155, "step": 7562 }, { "epoch": 0.23, "learning_rate": 4.5041502001361535e-06, "loss": 1.1144, "step": 7563 }, { "epoch": 0.23, "learning_rate": 4.5040043800323785e-06, "loss": 1.1743, "step": 7564 }, { "epoch": 0.23, "learning_rate": 4.503858540851447e-06, "loss": 1.0877, "step": 7565 }, { "epoch": 0.23, "learning_rate": 4.503712682594747e-06, "loss": 1.2094, "step": 7566 }, { "epoch": 0.23, "learning_rate": 4.503566805263668e-06, "loss": 1.1913, "step": 7567 }, { "epoch": 0.23, "learning_rate": 4.503420908859598e-06, "loss": 1.092, "step": 7568 }, { "epoch": 0.23, "learning_rate": 4.503274993383926e-06, "loss": 1.2463, "step": 7569 }, { "epoch": 0.23, "learning_rate": 4.50312905883804e-06, "loss": 1.1041, "step": 7570 }, { "epoch": 0.23, "learning_rate": 4.50298310522333e-06, "loss": 1.092, "step": 7571 }, { "epoch": 0.23, "learning_rate": 4.502837132541186e-06, "loss": 1.2367, "step": 7572 }, { "epoch": 0.23, "learning_rate": 4.502691140792997e-06, "loss": 1.0789, "step": 7573 }, { "epoch": 0.23, "learning_rate": 4.502545129980154e-06, "loss": 1.1595, "step": 7574 }, { "epoch": 0.23, "learning_rate": 4.5023991001040444e-06, "loss": 0.9984, "step": 7575 }, { "epoch": 0.23, "learning_rate": 4.50225305116606e-06, "loss": 1.1343, "step": 7576 }, { "epoch": 0.23, "learning_rate": 4.5021069831675915e-06, "loss": 1.0511, "step": 7577 }, { "epoch": 0.23, "learning_rate": 4.501960896110028e-06, "loss": 1.1247, "step": 7578 }, { "epoch": 0.23, "learning_rate": 4.501814789994761e-06, "loss": 1.2029, "step": 7579 }, { "epoch": 0.23, "learning_rate": 4.501668664823181e-06, "loss": 1.1127, "step": 7580 }, { "epoch": 0.23, "learning_rate": 4.50152252059668e-06, "loss": 1.2445, "step": 7581 }, { "epoch": 0.23, "learning_rate": 4.501376357316648e-06, "loss": 1.1049, "step": 7582 }, { "epoch": 0.23, "learning_rate": 4.501230174984478e-06, "loss": 1.1365, "step": 7583 }, { "epoch": 0.23, "learning_rate": 4.50108397360156e-06, "loss": 1.1243, "step": 7584 }, { "epoch": 0.23, "learning_rate": 4.500937753169286e-06, "loss": 1.0838, "step": 7585 }, { "epoch": 0.23, "learning_rate": 4.500791513689049e-06, "loss": 1.0632, "step": 7586 }, { "epoch": 0.23, "learning_rate": 4.500645255162239e-06, "loss": 1.2172, "step": 7587 }, { "epoch": 0.23, "learning_rate": 4.500498977590251e-06, "loss": 1.0923, "step": 7588 }, { "epoch": 0.23, "learning_rate": 4.500352680974475e-06, "loss": 1.1256, "step": 7589 }, { "epoch": 0.23, "learning_rate": 4.500206365316307e-06, "loss": 1.0748, "step": 7590 }, { "epoch": 0.23, "learning_rate": 4.500060030617136e-06, "loss": 1.179, "step": 7591 }, { "epoch": 0.23, "learning_rate": 4.499913676878358e-06, "loss": 1.2172, "step": 7592 }, { "epoch": 0.23, "learning_rate": 4.499767304101363e-06, "loss": 1.2309, "step": 7593 }, { "epoch": 0.23, "learning_rate": 4.499620912287549e-06, "loss": 1.1612, "step": 7594 }, { "epoch": 0.23, "learning_rate": 4.499474501438304e-06, "loss": 1.1039, "step": 7595 }, { "epoch": 0.23, "learning_rate": 4.499328071555027e-06, "loss": 1.0854, "step": 7596 }, { "epoch": 0.23, "learning_rate": 4.49918162263911e-06, "loss": 1.1875, "step": 7597 }, { "epoch": 0.23, "learning_rate": 4.499035154691945e-06, "loss": 1.1433, "step": 7598 }, { "epoch": 0.23, "learning_rate": 4.498888667714929e-06, "loss": 1.2506, "step": 7599 }, { "epoch": 0.23, "learning_rate": 4.498742161709455e-06, "loss": 1.1154, "step": 7600 }, { "epoch": 0.23, "learning_rate": 4.498595636676919e-06, "loss": 1.004, "step": 7601 }, { "epoch": 0.23, "learning_rate": 4.498449092618715e-06, "loss": 1.1558, "step": 7602 }, { "epoch": 0.23, "learning_rate": 4.498302529536238e-06, "loss": 1.3079, "step": 7603 }, { "epoch": 0.23, "learning_rate": 4.498155947430883e-06, "loss": 1.2006, "step": 7604 }, { "epoch": 0.23, "learning_rate": 4.4980093463040465e-06, "loss": 1.2129, "step": 7605 }, { "epoch": 0.23, "learning_rate": 4.497862726157122e-06, "loss": 1.2667, "step": 7606 }, { "epoch": 0.23, "learning_rate": 4.497716086991507e-06, "loss": 1.1927, "step": 7607 }, { "epoch": 0.23, "learning_rate": 4.497569428808598e-06, "loss": 1.1018, "step": 7608 }, { "epoch": 0.23, "learning_rate": 4.497422751609789e-06, "loss": 1.11, "step": 7609 }, { "epoch": 0.23, "learning_rate": 4.497276055396478e-06, "loss": 1.066, "step": 7610 }, { "epoch": 0.23, "learning_rate": 4.497129340170061e-06, "loss": 1.2371, "step": 7611 }, { "epoch": 0.23, "learning_rate": 4.496982605931934e-06, "loss": 1.1635, "step": 7612 }, { "epoch": 0.23, "learning_rate": 4.4968358526834945e-06, "loss": 1.1011, "step": 7613 }, { "epoch": 0.23, "learning_rate": 4.49668908042614e-06, "loss": 1.1661, "step": 7614 }, { "epoch": 0.23, "learning_rate": 4.496542289161266e-06, "loss": 1.1351, "step": 7615 }, { "epoch": 0.23, "learning_rate": 4.496395478890272e-06, "loss": 1.1829, "step": 7616 }, { "epoch": 0.23, "learning_rate": 4.496248649614554e-06, "loss": 1.1938, "step": 7617 }, { "epoch": 0.23, "learning_rate": 4.496101801335511e-06, "loss": 1.1751, "step": 7618 }, { "epoch": 0.23, "learning_rate": 4.495954934054539e-06, "loss": 1.1008, "step": 7619 }, { "epoch": 0.23, "learning_rate": 4.495808047773037e-06, "loss": 1.1742, "step": 7620 }, { "epoch": 0.23, "learning_rate": 4.4956611424924055e-06, "loss": 1.1066, "step": 7621 }, { "epoch": 0.23, "learning_rate": 4.49551421821404e-06, "loss": 1.0685, "step": 7622 }, { "epoch": 0.23, "learning_rate": 4.49536727493934e-06, "loss": 1.0532, "step": 7623 }, { "epoch": 0.23, "learning_rate": 4.495220312669705e-06, "loss": 1.1357, "step": 7624 }, { "epoch": 0.23, "learning_rate": 4.495073331406533e-06, "loss": 1.0566, "step": 7625 }, { "epoch": 0.23, "learning_rate": 4.494926331151224e-06, "loss": 1.1667, "step": 7626 }, { "epoch": 0.23, "learning_rate": 4.494779311905177e-06, "loss": 1.063, "step": 7627 }, { "epoch": 0.23, "learning_rate": 4.494632273669792e-06, "loss": 1.2125, "step": 7628 }, { "epoch": 0.23, "learning_rate": 4.494485216446469e-06, "loss": 1.1958, "step": 7629 }, { "epoch": 0.23, "learning_rate": 4.494338140236606e-06, "loss": 1.0435, "step": 7630 }, { "epoch": 0.23, "learning_rate": 4.494191045041605e-06, "loss": 1.2988, "step": 7631 }, { "epoch": 0.23, "learning_rate": 4.494043930862866e-06, "loss": 1.2621, "step": 7632 }, { "epoch": 0.23, "learning_rate": 4.493896797701789e-06, "loss": 1.1115, "step": 7633 }, { "epoch": 0.23, "learning_rate": 4.493749645559775e-06, "loss": 1.1064, "step": 7634 }, { "epoch": 0.23, "learning_rate": 4.4936024744382234e-06, "loss": 1.1852, "step": 7635 }, { "epoch": 0.23, "learning_rate": 4.493455284338537e-06, "loss": 1.1333, "step": 7636 }, { "epoch": 0.23, "learning_rate": 4.493308075262117e-06, "loss": 1.1586, "step": 7637 }, { "epoch": 0.23, "learning_rate": 4.493160847210364e-06, "loss": 1.2754, "step": 7638 }, { "epoch": 0.23, "learning_rate": 4.493013600184679e-06, "loss": 1.2039, "step": 7639 }, { "epoch": 0.23, "learning_rate": 4.492866334186466e-06, "loss": 1.1598, "step": 7640 }, { "epoch": 0.23, "learning_rate": 4.4927190492171235e-06, "loss": 1.2209, "step": 7641 }, { "epoch": 0.23, "learning_rate": 4.492571745278056e-06, "loss": 1.1885, "step": 7642 }, { "epoch": 0.23, "learning_rate": 4.492424422370664e-06, "loss": 1.1296, "step": 7643 }, { "epoch": 0.23, "learning_rate": 4.492277080496354e-06, "loss": 1.2007, "step": 7644 }, { "epoch": 0.23, "learning_rate": 4.492129719656523e-06, "loss": 1.1274, "step": 7645 }, { "epoch": 0.23, "learning_rate": 4.4919823398525776e-06, "loss": 1.0345, "step": 7646 }, { "epoch": 0.23, "learning_rate": 4.49183494108592e-06, "loss": 1.1865, "step": 7647 }, { "epoch": 0.23, "learning_rate": 4.491687523357951e-06, "loss": 1.1556, "step": 7648 }, { "epoch": 0.23, "learning_rate": 4.4915400866700785e-06, "loss": 1.1703, "step": 7649 }, { "epoch": 0.23, "learning_rate": 4.4913926310237025e-06, "loss": 1.1189, "step": 7650 }, { "epoch": 0.23, "learning_rate": 4.491245156420228e-06, "loss": 1.1443, "step": 7651 }, { "epoch": 0.23, "learning_rate": 4.491097662861058e-06, "loss": 1.0957, "step": 7652 }, { "epoch": 0.23, "learning_rate": 4.490950150347598e-06, "loss": 1.0614, "step": 7653 }, { "epoch": 0.23, "learning_rate": 4.490802618881252e-06, "loss": 1.2953, "step": 7654 }, { "epoch": 0.23, "learning_rate": 4.490655068463422e-06, "loss": 1.2507, "step": 7655 }, { "epoch": 0.23, "learning_rate": 4.4905074990955155e-06, "loss": 1.2889, "step": 7656 }, { "epoch": 0.23, "learning_rate": 4.4903599107789364e-06, "loss": 1.1832, "step": 7657 }, { "epoch": 0.23, "learning_rate": 4.490212303515089e-06, "loss": 1.1581, "step": 7658 }, { "epoch": 0.23, "learning_rate": 4.49006467730538e-06, "loss": 0.9861, "step": 7659 }, { "epoch": 0.23, "learning_rate": 4.489917032151213e-06, "loss": 1.1644, "step": 7660 }, { "epoch": 0.23, "learning_rate": 4.489769368053995e-06, "loss": 1.2355, "step": 7661 }, { "epoch": 0.23, "learning_rate": 4.48962168501513e-06, "loss": 1.1821, "step": 7662 }, { "epoch": 0.23, "learning_rate": 4.4894739830360244e-06, "loss": 1.1268, "step": 7663 }, { "epoch": 0.23, "learning_rate": 4.489326262118086e-06, "loss": 1.1492, "step": 7664 }, { "epoch": 0.23, "learning_rate": 4.489178522262718e-06, "loss": 1.1359, "step": 7665 }, { "epoch": 0.23, "learning_rate": 4.48903076347133e-06, "loss": 1.0892, "step": 7666 }, { "epoch": 0.23, "learning_rate": 4.488882985745326e-06, "loss": 1.304, "step": 7667 }, { "epoch": 0.23, "learning_rate": 4.488735189086115e-06, "loss": 1.0037, "step": 7668 }, { "epoch": 0.23, "learning_rate": 4.488587373495102e-06, "loss": 1.0919, "step": 7669 }, { "epoch": 0.23, "learning_rate": 4.488439538973695e-06, "loss": 1.1897, "step": 7670 }, { "epoch": 0.23, "learning_rate": 4.488291685523301e-06, "loss": 1.1619, "step": 7671 }, { "epoch": 0.23, "learning_rate": 4.4881438131453295e-06, "loss": 1.1868, "step": 7672 }, { "epoch": 0.23, "learning_rate": 4.487995921841184e-06, "loss": 1.2424, "step": 7673 }, { "epoch": 0.23, "learning_rate": 4.4878480116122755e-06, "loss": 1.0429, "step": 7674 }, { "epoch": 0.23, "learning_rate": 4.487700082460013e-06, "loss": 1.1519, "step": 7675 }, { "epoch": 0.23, "learning_rate": 4.487552134385801e-06, "loss": 1.1557, "step": 7676 }, { "epoch": 0.23, "learning_rate": 4.4874041673910505e-06, "loss": 1.0818, "step": 7677 }, { "epoch": 0.23, "learning_rate": 4.48725618147717e-06, "loss": 1.0229, "step": 7678 }, { "epoch": 0.23, "learning_rate": 4.487108176645567e-06, "loss": 1.1047, "step": 7679 }, { "epoch": 0.23, "learning_rate": 4.4869601528976515e-06, "loss": 1.0912, "step": 7680 }, { "epoch": 0.23, "learning_rate": 4.486812110234832e-06, "loss": 1.2998, "step": 7681 }, { "epoch": 0.23, "learning_rate": 4.486664048658519e-06, "loss": 1.1847, "step": 7682 }, { "epoch": 0.23, "learning_rate": 4.4865159681701194e-06, "loss": 1.1745, "step": 7683 }, { "epoch": 0.23, "learning_rate": 4.486367868771046e-06, "loss": 1.1428, "step": 7684 }, { "epoch": 0.23, "learning_rate": 4.486219750462707e-06, "loss": 1.1951, "step": 7685 }, { "epoch": 0.23, "learning_rate": 4.486071613246512e-06, "loss": 1.2278, "step": 7686 }, { "epoch": 0.23, "learning_rate": 4.485923457123872e-06, "loss": 1.3484, "step": 7687 }, { "epoch": 0.23, "learning_rate": 4.485775282096198e-06, "loss": 1.0493, "step": 7688 }, { "epoch": 0.23, "learning_rate": 4.4856270881648986e-06, "loss": 1.0899, "step": 7689 }, { "epoch": 0.23, "learning_rate": 4.485478875331386e-06, "loss": 1.2325, "step": 7690 }, { "epoch": 0.23, "learning_rate": 4.485330643597071e-06, "loss": 1.1107, "step": 7691 }, { "epoch": 0.23, "learning_rate": 4.485182392963364e-06, "loss": 1.1384, "step": 7692 }, { "epoch": 0.23, "learning_rate": 4.485034123431677e-06, "loss": 1.2216, "step": 7693 }, { "epoch": 0.23, "learning_rate": 4.484885835003421e-06, "loss": 1.0764, "step": 7694 }, { "epoch": 0.23, "learning_rate": 4.484737527680007e-06, "loss": 1.1384, "step": 7695 }, { "epoch": 0.23, "learning_rate": 4.484589201462849e-06, "loss": 1.1206, "step": 7696 }, { "epoch": 0.23, "learning_rate": 4.484440856353357e-06, "loss": 1.0457, "step": 7697 }, { "epoch": 0.23, "learning_rate": 4.484292492352944e-06, "loss": 1.1541, "step": 7698 }, { "epoch": 0.23, "learning_rate": 4.484144109463022e-06, "loss": 1.0773, "step": 7699 }, { "epoch": 0.23, "learning_rate": 4.4839957076850036e-06, "loss": 1.019, "step": 7700 }, { "epoch": 0.23, "learning_rate": 4.483847287020302e-06, "loss": 1.1041, "step": 7701 }, { "epoch": 0.23, "learning_rate": 4.483698847470329e-06, "loss": 1.0406, "step": 7702 }, { "epoch": 0.23, "learning_rate": 4.483550389036499e-06, "loss": 1.0851, "step": 7703 }, { "epoch": 0.23, "learning_rate": 4.4834019117202245e-06, "loss": 1.1461, "step": 7704 }, { "epoch": 0.23, "learning_rate": 4.483253415522918e-06, "loss": 1.218, "step": 7705 }, { "epoch": 0.23, "learning_rate": 4.483104900445996e-06, "loss": 1.2133, "step": 7706 }, { "epoch": 0.23, "learning_rate": 4.48295636649087e-06, "loss": 1.1444, "step": 7707 }, { "epoch": 0.23, "learning_rate": 4.482807813658953e-06, "loss": 1.1215, "step": 7708 }, { "epoch": 0.23, "learning_rate": 4.482659241951661e-06, "loss": 1.1954, "step": 7709 }, { "epoch": 0.23, "learning_rate": 4.482510651370409e-06, "loss": 1.1866, "step": 7710 }, { "epoch": 0.23, "learning_rate": 4.482362041916609e-06, "loss": 1.1661, "step": 7711 }, { "epoch": 0.23, "learning_rate": 4.482213413591678e-06, "loss": 1.0798, "step": 7712 }, { "epoch": 0.23, "learning_rate": 4.48206476639703e-06, "loss": 1.1662, "step": 7713 }, { "epoch": 0.23, "learning_rate": 4.48191610033408e-06, "loss": 1.1285, "step": 7714 }, { "epoch": 0.23, "learning_rate": 4.481767415404242e-06, "loss": 1.086, "step": 7715 }, { "epoch": 0.23, "learning_rate": 4.481618711608935e-06, "loss": 1.2285, "step": 7716 }, { "epoch": 0.23, "learning_rate": 4.481469988949571e-06, "loss": 1.1998, "step": 7717 }, { "epoch": 0.23, "learning_rate": 4.4813212474275664e-06, "loss": 1.3405, "step": 7718 }, { "epoch": 0.23, "learning_rate": 4.481172487044338e-06, "loss": 1.1151, "step": 7719 }, { "epoch": 0.23, "learning_rate": 4.481023707801302e-06, "loss": 1.1726, "step": 7720 }, { "epoch": 0.23, "learning_rate": 4.480874909699875e-06, "loss": 1.0681, "step": 7721 }, { "epoch": 0.23, "learning_rate": 4.480726092741472e-06, "loss": 1.1516, "step": 7722 }, { "epoch": 0.23, "learning_rate": 4.480577256927511e-06, "loss": 1.1371, "step": 7723 }, { "epoch": 0.23, "learning_rate": 4.480428402259408e-06, "loss": 1.1968, "step": 7724 }, { "epoch": 0.23, "learning_rate": 4.480279528738581e-06, "loss": 1.0883, "step": 7725 }, { "epoch": 0.23, "learning_rate": 4.480130636366446e-06, "loss": 1.2194, "step": 7726 }, { "epoch": 0.23, "learning_rate": 4.479981725144421e-06, "loss": 1.074, "step": 7727 }, { "epoch": 0.23, "learning_rate": 4.479832795073924e-06, "loss": 1.117, "step": 7728 }, { "epoch": 0.23, "learning_rate": 4.479683846156372e-06, "loss": 1.1028, "step": 7729 }, { "epoch": 0.23, "learning_rate": 4.479534878393184e-06, "loss": 1.1432, "step": 7730 }, { "epoch": 0.23, "learning_rate": 4.479385891785777e-06, "loss": 1.1314, "step": 7731 }, { "epoch": 0.23, "learning_rate": 4.479236886335569e-06, "loss": 1.0537, "step": 7732 }, { "epoch": 0.23, "learning_rate": 4.479087862043979e-06, "loss": 1.0533, "step": 7733 }, { "epoch": 0.23, "learning_rate": 4.478938818912427e-06, "loss": 1.1381, "step": 7734 }, { "epoch": 0.23, "learning_rate": 4.478789756942329e-06, "loss": 1.1274, "step": 7735 }, { "epoch": 0.23, "learning_rate": 4.478640676135106e-06, "loss": 1.1525, "step": 7736 }, { "epoch": 0.23, "learning_rate": 4.478491576492177e-06, "loss": 1.2164, "step": 7737 }, { "epoch": 0.23, "learning_rate": 4.478342458014962e-06, "loss": 1.1143, "step": 7738 }, { "epoch": 0.23, "learning_rate": 4.478193320704878e-06, "loss": 1.1881, "step": 7739 }, { "epoch": 0.23, "learning_rate": 4.478044164563347e-06, "loss": 1.1654, "step": 7740 }, { "epoch": 0.23, "learning_rate": 4.4778949895917875e-06, "loss": 1.0677, "step": 7741 }, { "epoch": 0.23, "learning_rate": 4.4777457957916215e-06, "loss": 1.1476, "step": 7742 }, { "epoch": 0.23, "learning_rate": 4.477596583164268e-06, "loss": 1.1245, "step": 7743 }, { "epoch": 0.23, "learning_rate": 4.477447351711146e-06, "loss": 1.1528, "step": 7744 }, { "epoch": 0.23, "learning_rate": 4.4772981014336784e-06, "loss": 1.1111, "step": 7745 }, { "epoch": 0.23, "learning_rate": 4.4771488323332854e-06, "loss": 1.1216, "step": 7746 }, { "epoch": 0.23, "learning_rate": 4.4769995444113875e-06, "loss": 1.1108, "step": 7747 }, { "epoch": 0.23, "learning_rate": 4.476850237669407e-06, "loss": 1.1512, "step": 7748 }, { "epoch": 0.23, "learning_rate": 4.476700912108763e-06, "loss": 1.2354, "step": 7749 }, { "epoch": 0.23, "learning_rate": 4.476551567730879e-06, "loss": 1.1235, "step": 7750 }, { "epoch": 0.23, "learning_rate": 4.4764022045371756e-06, "loss": 1.2336, "step": 7751 }, { "epoch": 0.23, "learning_rate": 4.476252822529075e-06, "loss": 1.0983, "step": 7752 }, { "epoch": 0.23, "learning_rate": 4.476103421708e-06, "loss": 1.1635, "step": 7753 }, { "epoch": 0.23, "learning_rate": 4.475954002075372e-06, "loss": 1.0657, "step": 7754 }, { "epoch": 0.23, "learning_rate": 4.4758045636326135e-06, "loss": 1.1829, "step": 7755 }, { "epoch": 0.23, "learning_rate": 4.475655106381147e-06, "loss": 1.2686, "step": 7756 }, { "epoch": 0.23, "learning_rate": 4.475505630322395e-06, "loss": 1.1935, "step": 7757 }, { "epoch": 0.23, "learning_rate": 4.475356135457781e-06, "loss": 1.1135, "step": 7758 }, { "epoch": 0.23, "learning_rate": 4.475206621788729e-06, "loss": 1.0898, "step": 7759 }, { "epoch": 0.23, "learning_rate": 4.47505708931666e-06, "loss": 1.2333, "step": 7760 }, { "epoch": 0.23, "learning_rate": 4.474907538043e-06, "loss": 1.2089, "step": 7761 }, { "epoch": 0.23, "learning_rate": 4.47475796796917e-06, "loss": 1.1323, "step": 7762 }, { "epoch": 0.23, "learning_rate": 4.474608379096595e-06, "loss": 1.2224, "step": 7763 }, { "epoch": 0.23, "learning_rate": 4.474458771426701e-06, "loss": 1.1641, "step": 7764 }, { "epoch": 0.23, "learning_rate": 4.4743091449609096e-06, "loss": 1.1028, "step": 7765 }, { "epoch": 0.23, "learning_rate": 4.474159499700645e-06, "loss": 1.1174, "step": 7766 }, { "epoch": 0.23, "learning_rate": 4.474009835647334e-06, "loss": 1.0869, "step": 7767 }, { "epoch": 0.23, "learning_rate": 4.473860152802399e-06, "loss": 1.1453, "step": 7768 }, { "epoch": 0.23, "learning_rate": 4.473710451167268e-06, "loss": 1.1068, "step": 7769 }, { "epoch": 0.23, "learning_rate": 4.473560730743362e-06, "loss": 1.1529, "step": 7770 }, { "epoch": 0.23, "learning_rate": 4.473410991532109e-06, "loss": 1.1741, "step": 7771 }, { "epoch": 0.23, "learning_rate": 4.473261233534935e-06, "loss": 1.0616, "step": 7772 }, { "epoch": 0.23, "learning_rate": 4.473111456753263e-06, "loss": 1.161, "step": 7773 }, { "epoch": 0.23, "learning_rate": 4.47296166118852e-06, "loss": 1.2427, "step": 7774 }, { "epoch": 0.23, "learning_rate": 4.472811846842133e-06, "loss": 1.0717, "step": 7775 }, { "epoch": 0.23, "learning_rate": 4.4726620137155266e-06, "loss": 1.128, "step": 7776 }, { "epoch": 0.23, "learning_rate": 4.472512161810129e-06, "loss": 1.1126, "step": 7777 }, { "epoch": 0.23, "learning_rate": 4.472362291127364e-06, "loss": 1.1876, "step": 7778 }, { "epoch": 0.23, "learning_rate": 4.472212401668661e-06, "loss": 1.2441, "step": 7779 }, { "epoch": 0.23, "learning_rate": 4.472062493435446e-06, "loss": 1.1829, "step": 7780 }, { "epoch": 0.23, "learning_rate": 4.471912566429145e-06, "loss": 1.0539, "step": 7781 }, { "epoch": 0.23, "learning_rate": 4.4717626206511875e-06, "loss": 1.162, "step": 7782 }, { "epoch": 0.23, "learning_rate": 4.471612656102998e-06, "loss": 1.1593, "step": 7783 }, { "epoch": 0.23, "learning_rate": 4.471462672786006e-06, "loss": 1.1659, "step": 7784 }, { "epoch": 0.23, "learning_rate": 4.47131267070164e-06, "loss": 1.2582, "step": 7785 }, { "epoch": 0.23, "learning_rate": 4.471162649851325e-06, "loss": 1.1015, "step": 7786 }, { "epoch": 0.23, "learning_rate": 4.4710126102364914e-06, "loss": 1.1376, "step": 7787 }, { "epoch": 0.23, "learning_rate": 4.470862551858568e-06, "loss": 1.2151, "step": 7788 }, { "epoch": 0.23, "learning_rate": 4.4707124747189814e-06, "loss": 1.105, "step": 7789 }, { "epoch": 0.23, "learning_rate": 4.470562378819161e-06, "loss": 1.0871, "step": 7790 }, { "epoch": 0.23, "learning_rate": 4.4704122641605365e-06, "loss": 1.0297, "step": 7791 }, { "epoch": 0.23, "learning_rate": 4.470262130744536e-06, "loss": 1.2576, "step": 7792 }, { "epoch": 0.23, "learning_rate": 4.470111978572589e-06, "loss": 1.348, "step": 7793 }, { "epoch": 0.23, "learning_rate": 4.469961807646124e-06, "loss": 1.1223, "step": 7794 }, { "epoch": 0.23, "learning_rate": 4.469811617966572e-06, "loss": 1.1783, "step": 7795 }, { "epoch": 0.23, "learning_rate": 4.469661409535363e-06, "loss": 1.1005, "step": 7796 }, { "epoch": 0.23, "learning_rate": 4.4695111823539245e-06, "loss": 1.1102, "step": 7797 }, { "epoch": 0.23, "learning_rate": 4.469360936423689e-06, "loss": 1.0655, "step": 7798 }, { "epoch": 0.23, "learning_rate": 4.469210671746085e-06, "loss": 1.1772, "step": 7799 }, { "epoch": 0.23, "learning_rate": 4.469060388322545e-06, "loss": 1.0846, "step": 7800 }, { "epoch": 0.24, "learning_rate": 4.468910086154498e-06, "loss": 1.1459, "step": 7801 }, { "epoch": 0.24, "learning_rate": 4.4687597652433745e-06, "loss": 1.0778, "step": 7802 }, { "epoch": 0.24, "learning_rate": 4.468609425590607e-06, "loss": 1.0925, "step": 7803 }, { "epoch": 0.24, "learning_rate": 4.468459067197626e-06, "loss": 1.251, "step": 7804 }, { "epoch": 0.24, "learning_rate": 4.468308690065862e-06, "loss": 1.2383, "step": 7805 }, { "epoch": 0.24, "learning_rate": 4.4681582941967475e-06, "loss": 1.2142, "step": 7806 }, { "epoch": 0.24, "learning_rate": 4.468007879591714e-06, "loss": 1.1631, "step": 7807 }, { "epoch": 0.24, "learning_rate": 4.467857446252193e-06, "loss": 1.0679, "step": 7808 }, { "epoch": 0.24, "learning_rate": 4.467706994179618e-06, "loss": 1.2328, "step": 7809 }, { "epoch": 0.24, "learning_rate": 4.4675565233754196e-06, "loss": 1.1619, "step": 7810 }, { "epoch": 0.24, "learning_rate": 4.46740603384103e-06, "loss": 1.1832, "step": 7811 }, { "epoch": 0.24, "learning_rate": 4.467255525577883e-06, "loss": 1.1911, "step": 7812 }, { "epoch": 0.24, "learning_rate": 4.46710499858741e-06, "loss": 1.1101, "step": 7813 }, { "epoch": 0.24, "learning_rate": 4.4669544528710465e-06, "loss": 1.1216, "step": 7814 }, { "epoch": 0.24, "learning_rate": 4.466803888430223e-06, "loss": 1.2412, "step": 7815 }, { "epoch": 0.24, "learning_rate": 4.4666533052663735e-06, "loss": 1.2148, "step": 7816 }, { "epoch": 0.24, "learning_rate": 4.4665027033809316e-06, "loss": 1.1531, "step": 7817 }, { "epoch": 0.24, "learning_rate": 4.466352082775331e-06, "loss": 1.1412, "step": 7818 }, { "epoch": 0.24, "learning_rate": 4.466201443451007e-06, "loss": 1.1299, "step": 7819 }, { "epoch": 0.24, "learning_rate": 4.466050785409391e-06, "loss": 1.2225, "step": 7820 }, { "epoch": 0.24, "learning_rate": 4.465900108651918e-06, "loss": 1.004, "step": 7821 }, { "epoch": 0.24, "learning_rate": 4.465749413180024e-06, "loss": 1.167, "step": 7822 }, { "epoch": 0.24, "learning_rate": 4.465598698995142e-06, "loss": 1.2143, "step": 7823 }, { "epoch": 0.24, "learning_rate": 4.465447966098707e-06, "loss": 1.3397, "step": 7824 }, { "epoch": 0.24, "learning_rate": 4.465297214492153e-06, "loss": 1.2832, "step": 7825 }, { "epoch": 0.24, "learning_rate": 4.4651464441769165e-06, "loss": 1.104, "step": 7826 }, { "epoch": 0.24, "learning_rate": 4.464995655154432e-06, "loss": 1.0665, "step": 7827 }, { "epoch": 0.24, "learning_rate": 4.464844847426137e-06, "loss": 1.1715, "step": 7828 }, { "epoch": 0.24, "learning_rate": 4.464694020993464e-06, "loss": 1.0663, "step": 7829 }, { "epoch": 0.24, "learning_rate": 4.46454317585785e-06, "loss": 1.1796, "step": 7830 }, { "epoch": 0.24, "learning_rate": 4.464392312020732e-06, "loss": 1.1915, "step": 7831 }, { "epoch": 0.24, "learning_rate": 4.464241429483545e-06, "loss": 1.1491, "step": 7832 }, { "epoch": 0.24, "learning_rate": 4.464090528247725e-06, "loss": 1.1212, "step": 7833 }, { "epoch": 0.24, "learning_rate": 4.463939608314709e-06, "loss": 1.1282, "step": 7834 }, { "epoch": 0.24, "learning_rate": 4.463788669685935e-06, "loss": 1.1758, "step": 7835 }, { "epoch": 0.24, "learning_rate": 4.463637712362837e-06, "loss": 1.3246, "step": 7836 }, { "epoch": 0.24, "learning_rate": 4.463486736346855e-06, "loss": 1.1311, "step": 7837 }, { "epoch": 0.24, "learning_rate": 4.463335741639424e-06, "loss": 1.0565, "step": 7838 }, { "epoch": 0.24, "learning_rate": 4.4631847282419825e-06, "loss": 1.1441, "step": 7839 }, { "epoch": 0.24, "learning_rate": 4.463033696155968e-06, "loss": 1.1592, "step": 7840 }, { "epoch": 0.24, "learning_rate": 4.462882645382819e-06, "loss": 1.0747, "step": 7841 }, { "epoch": 0.24, "learning_rate": 4.462731575923972e-06, "loss": 1.2037, "step": 7842 }, { "epoch": 0.24, "learning_rate": 4.462580487780866e-06, "loss": 1.1852, "step": 7843 }, { "epoch": 0.24, "learning_rate": 4.462429380954938e-06, "loss": 1.1826, "step": 7844 }, { "epoch": 0.24, "learning_rate": 4.462278255447628e-06, "loss": 1.2198, "step": 7845 }, { "epoch": 0.24, "learning_rate": 4.462127111260374e-06, "loss": 1.1205, "step": 7846 }, { "epoch": 0.24, "learning_rate": 4.461975948394615e-06, "loss": 1.1631, "step": 7847 }, { "epoch": 0.24, "learning_rate": 4.46182476685179e-06, "loss": 1.2183, "step": 7848 }, { "epoch": 0.24, "learning_rate": 4.4616735666333376e-06, "loss": 1.2119, "step": 7849 }, { "epoch": 0.24, "learning_rate": 4.461522347740698e-06, "loss": 1.2028, "step": 7850 }, { "epoch": 0.24, "learning_rate": 4.461371110175311e-06, "loss": 1.2388, "step": 7851 }, { "epoch": 0.24, "learning_rate": 4.461219853938615e-06, "loss": 1.2614, "step": 7852 }, { "epoch": 0.24, "learning_rate": 4.461068579032049e-06, "loss": 1.235, "step": 7853 }, { "epoch": 0.24, "learning_rate": 4.460917285457057e-06, "loss": 1.1889, "step": 7854 }, { "epoch": 0.24, "learning_rate": 4.460765973215076e-06, "loss": 1.2608, "step": 7855 }, { "epoch": 0.24, "learning_rate": 4.460614642307547e-06, "loss": 1.183, "step": 7856 }, { "epoch": 0.24, "learning_rate": 4.460463292735912e-06, "loss": 1.1989, "step": 7857 }, { "epoch": 0.24, "learning_rate": 4.4603119245016095e-06, "loss": 1.0407, "step": 7858 }, { "epoch": 0.24, "learning_rate": 4.460160537606081e-06, "loss": 1.0699, "step": 7859 }, { "epoch": 0.24, "learning_rate": 4.46000913205077e-06, "loss": 1.2549, "step": 7860 }, { "epoch": 0.24, "learning_rate": 4.4598577078371145e-06, "loss": 1.1674, "step": 7861 }, { "epoch": 0.24, "learning_rate": 4.459706264966558e-06, "loss": 1.0673, "step": 7862 }, { "epoch": 0.24, "learning_rate": 4.459554803440542e-06, "loss": 1.0482, "step": 7863 }, { "epoch": 0.24, "learning_rate": 4.459403323260508e-06, "loss": 1.1592, "step": 7864 }, { "epoch": 0.24, "learning_rate": 4.4592518244278986e-06, "loss": 1.1667, "step": 7865 }, { "epoch": 0.24, "learning_rate": 4.459100306944154e-06, "loss": 1.0671, "step": 7866 }, { "epoch": 0.24, "learning_rate": 4.458948770810718e-06, "loss": 1.1504, "step": 7867 }, { "epoch": 0.24, "learning_rate": 4.458797216029034e-06, "loss": 1.2781, "step": 7868 }, { "epoch": 0.24, "learning_rate": 4.458645642600544e-06, "loss": 1.1608, "step": 7869 }, { "epoch": 0.24, "learning_rate": 4.45849405052669e-06, "loss": 1.1036, "step": 7870 }, { "epoch": 0.24, "learning_rate": 4.458342439808917e-06, "loss": 1.1742, "step": 7871 }, { "epoch": 0.24, "learning_rate": 4.458190810448667e-06, "loss": 1.0813, "step": 7872 }, { "epoch": 0.24, "learning_rate": 4.458039162447383e-06, "loss": 1.1907, "step": 7873 }, { "epoch": 0.24, "learning_rate": 4.457887495806509e-06, "loss": 1.1782, "step": 7874 }, { "epoch": 0.24, "learning_rate": 4.4577358105274895e-06, "loss": 1.1801, "step": 7875 }, { "epoch": 0.24, "learning_rate": 4.457584106611768e-06, "loss": 1.2303, "step": 7876 }, { "epoch": 0.24, "learning_rate": 4.457432384060789e-06, "loss": 1.0813, "step": 7877 }, { "epoch": 0.24, "learning_rate": 4.457280642875995e-06, "loss": 1.2009, "step": 7878 }, { "epoch": 0.24, "learning_rate": 4.457128883058833e-06, "loss": 1.2347, "step": 7879 }, { "epoch": 0.24, "learning_rate": 4.456977104610747e-06, "loss": 1.0742, "step": 7880 }, { "epoch": 0.24, "learning_rate": 4.456825307533181e-06, "loss": 1.1774, "step": 7881 }, { "epoch": 0.24, "learning_rate": 4.45667349182758e-06, "loss": 1.0427, "step": 7882 }, { "epoch": 0.24, "learning_rate": 4.45652165749539e-06, "loss": 1.1793, "step": 7883 }, { "epoch": 0.24, "learning_rate": 4.456369804538057e-06, "loss": 1.1595, "step": 7884 }, { "epoch": 0.24, "learning_rate": 4.4562179329570244e-06, "loss": 1.0846, "step": 7885 }, { "epoch": 0.24, "learning_rate": 4.45606604275374e-06, "loss": 1.0973, "step": 7886 }, { "epoch": 0.24, "learning_rate": 4.455914133929649e-06, "loss": 1.2338, "step": 7887 }, { "epoch": 0.24, "learning_rate": 4.455762206486197e-06, "loss": 1.1283, "step": 7888 }, { "epoch": 0.24, "learning_rate": 4.455610260424831e-06, "loss": 1.1552, "step": 7889 }, { "epoch": 0.24, "learning_rate": 4.455458295746997e-06, "loss": 1.0464, "step": 7890 }, { "epoch": 0.24, "learning_rate": 4.455306312454142e-06, "loss": 1.0989, "step": 7891 }, { "epoch": 0.24, "learning_rate": 4.4551543105477125e-06, "loss": 1.119, "step": 7892 }, { "epoch": 0.24, "learning_rate": 4.455002290029155e-06, "loss": 1.0106, "step": 7893 }, { "epoch": 0.24, "learning_rate": 4.454850250899918e-06, "loss": 1.1262, "step": 7894 }, { "epoch": 0.24, "learning_rate": 4.4546981931614474e-06, "loss": 1.0757, "step": 7895 }, { "epoch": 0.24, "learning_rate": 4.4545461168151924e-06, "loss": 1.1639, "step": 7896 }, { "epoch": 0.24, "learning_rate": 4.454394021862599e-06, "loss": 1.0818, "step": 7897 }, { "epoch": 0.24, "learning_rate": 4.454241908305116e-06, "loss": 1.1544, "step": 7898 }, { "epoch": 0.24, "learning_rate": 4.454089776144192e-06, "loss": 1.1641, "step": 7899 }, { "epoch": 0.24, "learning_rate": 4.4539376253812735e-06, "loss": 1.2039, "step": 7900 }, { "epoch": 0.24, "learning_rate": 4.45378545601781e-06, "loss": 1.0464, "step": 7901 }, { "epoch": 0.24, "learning_rate": 4.453633268055249e-06, "loss": 1.2211, "step": 7902 }, { "epoch": 0.24, "learning_rate": 4.453481061495042e-06, "loss": 1.0961, "step": 7903 }, { "epoch": 0.24, "learning_rate": 4.4533288363386355e-06, "loss": 1.1863, "step": 7904 }, { "epoch": 0.24, "learning_rate": 4.453176592587479e-06, "loss": 1.1955, "step": 7905 }, { "epoch": 0.24, "learning_rate": 4.453024330243022e-06, "loss": 1.2641, "step": 7906 }, { "epoch": 0.24, "learning_rate": 4.452872049306714e-06, "loss": 1.1568, "step": 7907 }, { "epoch": 0.24, "learning_rate": 4.452719749780005e-06, "loss": 1.1518, "step": 7908 }, { "epoch": 0.24, "learning_rate": 4.4525674316643445e-06, "loss": 1.1196, "step": 7909 }, { "epoch": 0.24, "learning_rate": 4.4524150949611815e-06, "loss": 1.1393, "step": 7910 }, { "epoch": 0.24, "learning_rate": 4.4522627396719675e-06, "loss": 1.1055, "step": 7911 }, { "epoch": 0.24, "learning_rate": 4.452110365798153e-06, "loss": 1.2839, "step": 7912 }, { "epoch": 0.24, "learning_rate": 4.451957973341188e-06, "loss": 1.1273, "step": 7913 }, { "epoch": 0.24, "learning_rate": 4.451805562302523e-06, "loss": 1.2091, "step": 7914 }, { "epoch": 0.24, "learning_rate": 4.451653132683608e-06, "loss": 1.1501, "step": 7915 }, { "epoch": 0.24, "learning_rate": 4.451500684485896e-06, "loss": 1.0739, "step": 7916 }, { "epoch": 0.24, "learning_rate": 4.451348217710838e-06, "loss": 1.1884, "step": 7917 }, { "epoch": 0.24, "learning_rate": 4.451195732359884e-06, "loss": 1.1425, "step": 7918 }, { "epoch": 0.24, "learning_rate": 4.451043228434486e-06, "loss": 1.0618, "step": 7919 }, { "epoch": 0.24, "learning_rate": 4.4508907059360964e-06, "loss": 1.1638, "step": 7920 }, { "epoch": 0.24, "learning_rate": 4.450738164866168e-06, "loss": 1.0984, "step": 7921 }, { "epoch": 0.24, "learning_rate": 4.450585605226151e-06, "loss": 1.1284, "step": 7922 }, { "epoch": 0.24, "learning_rate": 4.450433027017497e-06, "loss": 1.2583, "step": 7923 }, { "epoch": 0.24, "learning_rate": 4.450280430241663e-06, "loss": 1.0807, "step": 7924 }, { "epoch": 0.24, "learning_rate": 4.450127814900096e-06, "loss": 1.1036, "step": 7925 }, { "epoch": 0.24, "learning_rate": 4.449975180994252e-06, "loss": 1.0587, "step": 7926 }, { "epoch": 0.24, "learning_rate": 4.449822528525584e-06, "loss": 1.1541, "step": 7927 }, { "epoch": 0.24, "learning_rate": 4.449669857495544e-06, "loss": 1.1586, "step": 7928 }, { "epoch": 0.24, "learning_rate": 4.449517167905586e-06, "loss": 1.2906, "step": 7929 }, { "epoch": 0.24, "learning_rate": 4.449364459757164e-06, "loss": 1.3253, "step": 7930 }, { "epoch": 0.24, "learning_rate": 4.4492117330517315e-06, "loss": 1.2844, "step": 7931 }, { "epoch": 0.24, "learning_rate": 4.449058987790741e-06, "loss": 1.053, "step": 7932 }, { "epoch": 0.24, "learning_rate": 4.448906223975648e-06, "loss": 1.0742, "step": 7933 }, { "epoch": 0.24, "learning_rate": 4.448753441607907e-06, "loss": 1.1511, "step": 7934 }, { "epoch": 0.24, "learning_rate": 4.4486006406889705e-06, "loss": 1.1647, "step": 7935 }, { "epoch": 0.24, "learning_rate": 4.448447821220296e-06, "loss": 1.2203, "step": 7936 }, { "epoch": 0.24, "learning_rate": 4.448294983203336e-06, "loss": 1.113, "step": 7937 }, { "epoch": 0.24, "learning_rate": 4.448142126639545e-06, "loss": 1.138, "step": 7938 }, { "epoch": 0.24, "learning_rate": 4.44798925153038e-06, "loss": 1.0695, "step": 7939 }, { "epoch": 0.24, "learning_rate": 4.447836357877296e-06, "loss": 1.1426, "step": 7940 }, { "epoch": 0.24, "learning_rate": 4.447683445681748e-06, "loss": 1.1262, "step": 7941 }, { "epoch": 0.24, "learning_rate": 4.447530514945191e-06, "loss": 1.0544, "step": 7942 }, { "epoch": 0.24, "learning_rate": 4.447377565669081e-06, "loss": 1.1482, "step": 7943 }, { "epoch": 0.24, "learning_rate": 4.447224597854875e-06, "loss": 1.1436, "step": 7944 }, { "epoch": 0.24, "learning_rate": 4.447071611504029e-06, "loss": 1.2139, "step": 7945 }, { "epoch": 0.24, "learning_rate": 4.446918606617999e-06, "loss": 1.0849, "step": 7946 }, { "epoch": 0.24, "learning_rate": 4.446765583198242e-06, "loss": 1.1539, "step": 7947 }, { "epoch": 0.24, "learning_rate": 4.446612541246213e-06, "loss": 1.1136, "step": 7948 }, { "epoch": 0.24, "learning_rate": 4.446459480763371e-06, "loss": 1.1942, "step": 7949 }, { "epoch": 0.24, "learning_rate": 4.446306401751172e-06, "loss": 1.2816, "step": 7950 }, { "epoch": 0.24, "learning_rate": 4.446153304211074e-06, "loss": 1.1587, "step": 7951 }, { "epoch": 0.24, "learning_rate": 4.446000188144532e-06, "loss": 1.1858, "step": 7952 }, { "epoch": 0.24, "learning_rate": 4.445847053553008e-06, "loss": 1.1284, "step": 7953 }, { "epoch": 0.24, "learning_rate": 4.445693900437955e-06, "loss": 1.1808, "step": 7954 }, { "epoch": 0.24, "learning_rate": 4.445540728800834e-06, "loss": 1.1431, "step": 7955 }, { "epoch": 0.24, "learning_rate": 4.445387538643102e-06, "loss": 1.2555, "step": 7956 }, { "epoch": 0.24, "learning_rate": 4.445234329966218e-06, "loss": 1.0815, "step": 7957 }, { "epoch": 0.24, "learning_rate": 4.44508110277164e-06, "loss": 1.1338, "step": 7958 }, { "epoch": 0.24, "learning_rate": 4.4449278570608264e-06, "loss": 1.1624, "step": 7959 }, { "epoch": 0.24, "learning_rate": 4.444774592835236e-06, "loss": 1.0977, "step": 7960 }, { "epoch": 0.24, "learning_rate": 4.444621310096329e-06, "loss": 1.1797, "step": 7961 }, { "epoch": 0.24, "learning_rate": 4.444468008845563e-06, "loss": 1.1359, "step": 7962 }, { "epoch": 0.24, "learning_rate": 4.444314689084398e-06, "loss": 1.2845, "step": 7963 }, { "epoch": 0.24, "learning_rate": 4.444161350814295e-06, "loss": 1.0662, "step": 7964 }, { "epoch": 0.24, "learning_rate": 4.4440079940367105e-06, "loss": 1.0358, "step": 7965 }, { "epoch": 0.24, "learning_rate": 4.4438546187531066e-06, "loss": 1.0928, "step": 7966 }, { "epoch": 0.24, "learning_rate": 4.443701224964943e-06, "loss": 1.2373, "step": 7967 }, { "epoch": 0.24, "learning_rate": 4.44354781267368e-06, "loss": 1.2357, "step": 7968 }, { "epoch": 0.24, "learning_rate": 4.443394381880778e-06, "loss": 1.0406, "step": 7969 }, { "epoch": 0.24, "learning_rate": 4.443240932587697e-06, "loss": 1.1857, "step": 7970 }, { "epoch": 0.24, "learning_rate": 4.4430874647958985e-06, "loss": 1.1573, "step": 7971 }, { "epoch": 0.24, "learning_rate": 4.442933978506843e-06, "loss": 1.1655, "step": 7972 }, { "epoch": 0.24, "learning_rate": 4.442780473721993e-06, "loss": 1.207, "step": 7973 }, { "epoch": 0.24, "learning_rate": 4.442626950442807e-06, "loss": 1.1916, "step": 7974 }, { "epoch": 0.24, "learning_rate": 4.442473408670748e-06, "loss": 1.1768, "step": 7975 }, { "epoch": 0.24, "learning_rate": 4.442319848407279e-06, "loss": 1.191, "step": 7976 }, { "epoch": 0.24, "learning_rate": 4.442166269653859e-06, "loss": 1.1396, "step": 7977 }, { "epoch": 0.24, "learning_rate": 4.442012672411953e-06, "loss": 1.107, "step": 7978 }, { "epoch": 0.24, "learning_rate": 4.44185905668302e-06, "loss": 1.2402, "step": 7979 }, { "epoch": 0.24, "learning_rate": 4.441705422468525e-06, "loss": 1.2397, "step": 7980 }, { "epoch": 0.24, "learning_rate": 4.44155176976993e-06, "loss": 1.0179, "step": 7981 }, { "epoch": 0.24, "learning_rate": 4.441398098588696e-06, "loss": 1.1895, "step": 7982 }, { "epoch": 0.24, "learning_rate": 4.441244408926288e-06, "loss": 1.1206, "step": 7983 }, { "epoch": 0.24, "learning_rate": 4.441090700784167e-06, "loss": 0.9675, "step": 7984 }, { "epoch": 0.24, "learning_rate": 4.440936974163799e-06, "loss": 1.1792, "step": 7985 }, { "epoch": 0.24, "learning_rate": 4.440783229066645e-06, "loss": 1.1204, "step": 7986 }, { "epoch": 0.24, "learning_rate": 4.440629465494169e-06, "loss": 1.2523, "step": 7987 }, { "epoch": 0.24, "learning_rate": 4.4404756834478366e-06, "loss": 1.1115, "step": 7988 }, { "epoch": 0.24, "learning_rate": 4.440321882929109e-06, "loss": 1.0291, "step": 7989 }, { "epoch": 0.24, "learning_rate": 4.440168063939452e-06, "loss": 1.2223, "step": 7990 }, { "epoch": 0.24, "learning_rate": 4.440014226480329e-06, "loss": 0.9936, "step": 7991 }, { "epoch": 0.24, "learning_rate": 4.439860370553205e-06, "loss": 1.1622, "step": 7992 }, { "epoch": 0.24, "learning_rate": 4.4397064961595445e-06, "loss": 1.2214, "step": 7993 }, { "epoch": 0.24, "learning_rate": 4.439552603300813e-06, "loss": 1.0776, "step": 7994 }, { "epoch": 0.24, "learning_rate": 4.4393986919784745e-06, "loss": 1.2139, "step": 7995 }, { "epoch": 0.24, "learning_rate": 4.439244762193994e-06, "loss": 1.0912, "step": 7996 }, { "epoch": 0.24, "learning_rate": 4.439090813948838e-06, "loss": 1.1528, "step": 7997 }, { "epoch": 0.24, "learning_rate": 4.438936847244471e-06, "loss": 1.1414, "step": 7998 }, { "epoch": 0.24, "learning_rate": 4.438782862082359e-06, "loss": 1.1915, "step": 7999 }, { "epoch": 0.24, "learning_rate": 4.438628858463968e-06, "loss": 1.2137, "step": 8000 }, { "epoch": 0.24, "learning_rate": 4.438474836390765e-06, "loss": 1.1593, "step": 8001 }, { "epoch": 0.24, "learning_rate": 4.438320795864214e-06, "loss": 1.0856, "step": 8002 }, { "epoch": 0.24, "learning_rate": 4.438166736885782e-06, "loss": 1.1267, "step": 8003 }, { "epoch": 0.24, "learning_rate": 4.438012659456937e-06, "loss": 1.1837, "step": 8004 }, { "epoch": 0.24, "learning_rate": 4.437858563579145e-06, "loss": 1.1456, "step": 8005 }, { "epoch": 0.24, "learning_rate": 4.437704449253872e-06, "loss": 1.0795, "step": 8006 }, { "epoch": 0.24, "learning_rate": 4.437550316482586e-06, "loss": 1.1174, "step": 8007 }, { "epoch": 0.24, "learning_rate": 4.437396165266755e-06, "loss": 1.2197, "step": 8008 }, { "epoch": 0.24, "learning_rate": 4.437241995607845e-06, "loss": 1.1523, "step": 8009 }, { "epoch": 0.24, "learning_rate": 4.437087807507324e-06, "loss": 1.254, "step": 8010 }, { "epoch": 0.24, "learning_rate": 4.436933600966661e-06, "loss": 1.1293, "step": 8011 }, { "epoch": 0.24, "learning_rate": 4.436779375987322e-06, "loss": 1.1516, "step": 8012 }, { "epoch": 0.24, "learning_rate": 4.436625132570776e-06, "loss": 1.0793, "step": 8013 }, { "epoch": 0.24, "learning_rate": 4.4364708707184925e-06, "loss": 1.064, "step": 8014 }, { "epoch": 0.24, "learning_rate": 4.436316590431938e-06, "loss": 1.2316, "step": 8015 }, { "epoch": 0.24, "learning_rate": 4.436162291712582e-06, "loss": 1.0907, "step": 8016 }, { "epoch": 0.24, "learning_rate": 4.436007974561894e-06, "loss": 1.1115, "step": 8017 }, { "epoch": 0.24, "learning_rate": 4.435853638981343e-06, "loss": 1.2773, "step": 8018 }, { "epoch": 0.24, "learning_rate": 4.4356992849723965e-06, "loss": 1.1716, "step": 8019 }, { "epoch": 0.24, "learning_rate": 4.4355449125365255e-06, "loss": 1.2233, "step": 8020 }, { "epoch": 0.24, "learning_rate": 4.435390521675199e-06, "loss": 1.0585, "step": 8021 }, { "epoch": 0.24, "learning_rate": 4.435236112389888e-06, "loss": 1.1956, "step": 8022 }, { "epoch": 0.24, "learning_rate": 4.43508168468206e-06, "loss": 1.2044, "step": 8023 }, { "epoch": 0.24, "learning_rate": 4.434927238553186e-06, "loss": 1.2375, "step": 8024 }, { "epoch": 0.24, "learning_rate": 4.4347727740047375e-06, "loss": 1.1332, "step": 8025 }, { "epoch": 0.24, "learning_rate": 4.4346182910381845e-06, "loss": 1.1552, "step": 8026 }, { "epoch": 0.24, "learning_rate": 4.434463789654996e-06, "loss": 1.152, "step": 8027 }, { "epoch": 0.24, "learning_rate": 4.434309269856644e-06, "loss": 1.1022, "step": 8028 }, { "epoch": 0.24, "learning_rate": 4.4341547316446e-06, "loss": 1.2076, "step": 8029 }, { "epoch": 0.24, "learning_rate": 4.434000175020334e-06, "loss": 1.2782, "step": 8030 }, { "epoch": 0.24, "learning_rate": 4.4338455999853176e-06, "loss": 1.1791, "step": 8031 }, { "epoch": 0.24, "learning_rate": 4.433691006541023e-06, "loss": 1.0434, "step": 8032 }, { "epoch": 0.24, "learning_rate": 4.433536394688921e-06, "loss": 1.1109, "step": 8033 }, { "epoch": 0.24, "learning_rate": 4.4333817644304834e-06, "loss": 1.0406, "step": 8034 }, { "epoch": 0.24, "learning_rate": 4.433227115767183e-06, "loss": 1.1707, "step": 8035 }, { "epoch": 0.24, "learning_rate": 4.433072448700492e-06, "loss": 1.1721, "step": 8036 }, { "epoch": 0.24, "learning_rate": 4.432917763231881e-06, "loss": 1.2971, "step": 8037 }, { "epoch": 0.24, "learning_rate": 4.432763059362825e-06, "loss": 1.097, "step": 8038 }, { "epoch": 0.24, "learning_rate": 4.432608337094795e-06, "loss": 1.1282, "step": 8039 }, { "epoch": 0.24, "learning_rate": 4.432453596429265e-06, "loss": 1.0529, "step": 8040 }, { "epoch": 0.24, "learning_rate": 4.432298837367707e-06, "loss": 1.1046, "step": 8041 }, { "epoch": 0.24, "learning_rate": 4.432144059911595e-06, "loss": 1.2341, "step": 8042 }, { "epoch": 0.24, "learning_rate": 4.431989264062401e-06, "loss": 1.2748, "step": 8043 }, { "epoch": 0.24, "learning_rate": 4.4318344498216e-06, "loss": 1.0856, "step": 8044 }, { "epoch": 0.24, "learning_rate": 4.431679617190667e-06, "loss": 1.1339, "step": 8045 }, { "epoch": 0.24, "learning_rate": 4.431524766171073e-06, "loss": 1.0223, "step": 8046 }, { "epoch": 0.24, "learning_rate": 4.431369896764294e-06, "loss": 1.1754, "step": 8047 }, { "epoch": 0.24, "learning_rate": 4.431215008971803e-06, "loss": 1.0849, "step": 8048 }, { "epoch": 0.24, "learning_rate": 4.431060102795076e-06, "loss": 1.1964, "step": 8049 }, { "epoch": 0.24, "learning_rate": 4.430905178235586e-06, "loss": 1.0989, "step": 8050 }, { "epoch": 0.24, "learning_rate": 4.43075023529481e-06, "loss": 1.1728, "step": 8051 }, { "epoch": 0.24, "learning_rate": 4.4305952739742205e-06, "loss": 1.0834, "step": 8052 }, { "epoch": 0.24, "learning_rate": 4.430440294275295e-06, "loss": 1.1642, "step": 8053 }, { "epoch": 0.24, "learning_rate": 4.430285296199506e-06, "loss": 1.055, "step": 8054 }, { "epoch": 0.24, "learning_rate": 4.430130279748331e-06, "loss": 1.1239, "step": 8055 }, { "epoch": 0.24, "learning_rate": 4.429975244923247e-06, "loss": 1.1863, "step": 8056 }, { "epoch": 0.24, "learning_rate": 4.429820191725726e-06, "loss": 1.1256, "step": 8057 }, { "epoch": 0.24, "learning_rate": 4.429665120157247e-06, "loss": 1.0743, "step": 8058 }, { "epoch": 0.24, "learning_rate": 4.4295100302192865e-06, "loss": 1.0575, "step": 8059 }, { "epoch": 0.24, "learning_rate": 4.429354921913318e-06, "loss": 1.0447, "step": 8060 }, { "epoch": 0.24, "learning_rate": 4.429199795240821e-06, "loss": 1.1481, "step": 8061 }, { "epoch": 0.24, "learning_rate": 4.42904465020327e-06, "loss": 1.3103, "step": 8062 }, { "epoch": 0.24, "learning_rate": 4.428889486802145e-06, "loss": 1.1431, "step": 8063 }, { "epoch": 0.24, "learning_rate": 4.42873430503892e-06, "loss": 1.1853, "step": 8064 }, { "epoch": 0.24, "learning_rate": 4.428579104915072e-06, "loss": 1.1296, "step": 8065 }, { "epoch": 0.24, "learning_rate": 4.428423886432082e-06, "loss": 1.1759, "step": 8066 }, { "epoch": 0.24, "learning_rate": 4.428268649591424e-06, "loss": 1.1272, "step": 8067 }, { "epoch": 0.24, "learning_rate": 4.428113394394578e-06, "loss": 1.1377, "step": 8068 }, { "epoch": 0.24, "learning_rate": 4.42795812084302e-06, "loss": 1.1102, "step": 8069 }, { "epoch": 0.24, "learning_rate": 4.4278028289382295e-06, "loss": 1.14, "step": 8070 }, { "epoch": 0.24, "learning_rate": 4.427647518681685e-06, "loss": 1.1193, "step": 8071 }, { "epoch": 0.24, "learning_rate": 4.427492190074864e-06, "loss": 1.1371, "step": 8072 }, { "epoch": 0.24, "learning_rate": 4.427336843119247e-06, "loss": 1.1761, "step": 8073 }, { "epoch": 0.24, "learning_rate": 4.4271814778163096e-06, "loss": 1.2954, "step": 8074 }, { "epoch": 0.24, "learning_rate": 4.427026094167534e-06, "loss": 1.15, "step": 8075 }, { "epoch": 0.24, "learning_rate": 4.426870692174397e-06, "loss": 1.1761, "step": 8076 }, { "epoch": 0.24, "learning_rate": 4.42671527183838e-06, "loss": 1.077, "step": 8077 }, { "epoch": 0.24, "learning_rate": 4.426559833160961e-06, "loss": 1.1414, "step": 8078 }, { "epoch": 0.24, "learning_rate": 4.426404376143621e-06, "loss": 1.1417, "step": 8079 }, { "epoch": 0.24, "learning_rate": 4.426248900787838e-06, "loss": 1.0883, "step": 8080 }, { "epoch": 0.24, "learning_rate": 4.426093407095095e-06, "loss": 1.1419, "step": 8081 }, { "epoch": 0.24, "learning_rate": 4.425937895066868e-06, "loss": 1.202, "step": 8082 }, { "epoch": 0.24, "learning_rate": 4.425782364704642e-06, "loss": 1.1241, "step": 8083 }, { "epoch": 0.24, "learning_rate": 4.425626816009894e-06, "loss": 1.1582, "step": 8084 }, { "epoch": 0.24, "learning_rate": 4.425471248984106e-06, "loss": 1.2221, "step": 8085 }, { "epoch": 0.24, "learning_rate": 4.42531566362876e-06, "loss": 1.248, "step": 8086 }, { "epoch": 0.24, "learning_rate": 4.425160059945335e-06, "loss": 1.0651, "step": 8087 }, { "epoch": 0.24, "learning_rate": 4.425004437935314e-06, "loss": 1.1818, "step": 8088 }, { "epoch": 0.24, "learning_rate": 4.424848797600179e-06, "loss": 1.0873, "step": 8089 }, { "epoch": 0.24, "learning_rate": 4.424693138941409e-06, "loss": 1.1189, "step": 8090 }, { "epoch": 0.24, "learning_rate": 4.424537461960488e-06, "loss": 1.1472, "step": 8091 }, { "epoch": 0.24, "learning_rate": 4.424381766658896e-06, "loss": 1.1208, "step": 8092 }, { "epoch": 0.24, "learning_rate": 4.424226053038118e-06, "loss": 1.1375, "step": 8093 }, { "epoch": 0.24, "learning_rate": 4.424070321099634e-06, "loss": 1.226, "step": 8094 }, { "epoch": 0.24, "learning_rate": 4.4239145708449275e-06, "loss": 1.0613, "step": 8095 }, { "epoch": 0.24, "learning_rate": 4.423758802275481e-06, "loss": 1.094, "step": 8096 }, { "epoch": 0.24, "learning_rate": 4.423603015392777e-06, "loss": 1.124, "step": 8097 }, { "epoch": 0.24, "learning_rate": 4.423447210198298e-06, "loss": 1.1565, "step": 8098 }, { "epoch": 0.24, "learning_rate": 4.423291386693528e-06, "loss": 1.1765, "step": 8099 }, { "epoch": 0.24, "learning_rate": 4.4231355448799514e-06, "loss": 1.1245, "step": 8100 }, { "epoch": 0.24, "learning_rate": 4.42297968475905e-06, "loss": 1.1304, "step": 8101 }, { "epoch": 0.24, "learning_rate": 4.422823806332308e-06, "loss": 1.0903, "step": 8102 }, { "epoch": 0.24, "learning_rate": 4.42266790960121e-06, "loss": 1.1526, "step": 8103 }, { "epoch": 0.24, "learning_rate": 4.422511994567239e-06, "loss": 1.1605, "step": 8104 }, { "epoch": 0.24, "learning_rate": 4.4223560612318795e-06, "loss": 1.2169, "step": 8105 }, { "epoch": 0.24, "learning_rate": 4.422200109596616e-06, "loss": 1.1373, "step": 8106 }, { "epoch": 0.24, "learning_rate": 4.422044139662934e-06, "loss": 1.1785, "step": 8107 }, { "epoch": 0.24, "learning_rate": 4.421888151432318e-06, "loss": 1.2105, "step": 8108 }, { "epoch": 0.24, "learning_rate": 4.421732144906251e-06, "loss": 1.176, "step": 8109 }, { "epoch": 0.24, "learning_rate": 4.42157612008622e-06, "loss": 1.2693, "step": 8110 }, { "epoch": 0.24, "learning_rate": 4.42142007697371e-06, "loss": 1.2548, "step": 8111 }, { "epoch": 0.24, "learning_rate": 4.4212640155702056e-06, "loss": 1.2562, "step": 8112 }, { "epoch": 0.24, "learning_rate": 4.4211079358771945e-06, "loss": 1.187, "step": 8113 }, { "epoch": 0.24, "learning_rate": 4.42095183789616e-06, "loss": 1.2155, "step": 8114 }, { "epoch": 0.24, "learning_rate": 4.420795721628589e-06, "loss": 1.0437, "step": 8115 }, { "epoch": 0.24, "learning_rate": 4.420639587075969e-06, "loss": 1.1505, "step": 8116 }, { "epoch": 0.24, "learning_rate": 4.420483434239784e-06, "loss": 1.2192, "step": 8117 }, { "epoch": 0.24, "learning_rate": 4.420327263121522e-06, "loss": 1.1306, "step": 8118 }, { "epoch": 0.24, "learning_rate": 4.420171073722669e-06, "loss": 1.1, "step": 8119 }, { "epoch": 0.24, "learning_rate": 4.420014866044713e-06, "loss": 1.1251, "step": 8120 }, { "epoch": 0.24, "learning_rate": 4.41985864008914e-06, "loss": 1.1, "step": 8121 }, { "epoch": 0.24, "learning_rate": 4.419702395857437e-06, "loss": 1.1216, "step": 8122 }, { "epoch": 0.24, "learning_rate": 4.419546133351091e-06, "loss": 1.1393, "step": 8123 }, { "epoch": 0.24, "learning_rate": 4.419389852571592e-06, "loss": 1.0246, "step": 8124 }, { "epoch": 0.24, "learning_rate": 4.419233553520425e-06, "loss": 1.2021, "step": 8125 }, { "epoch": 0.24, "learning_rate": 4.419077236199078e-06, "loss": 1.1174, "step": 8126 }, { "epoch": 0.24, "learning_rate": 4.418920900609041e-06, "loss": 1.231, "step": 8127 }, { "epoch": 0.24, "learning_rate": 4.418764546751802e-06, "loss": 0.9951, "step": 8128 }, { "epoch": 0.24, "learning_rate": 4.418608174628847e-06, "loss": 1.1029, "step": 8129 }, { "epoch": 0.24, "learning_rate": 4.4184517842416675e-06, "loss": 1.144, "step": 8130 }, { "epoch": 0.24, "learning_rate": 4.41829537559175e-06, "loss": 1.2591, "step": 8131 }, { "epoch": 0.24, "learning_rate": 4.4181389486805846e-06, "loss": 1.0481, "step": 8132 }, { "epoch": 0.25, "learning_rate": 4.417982503509661e-06, "loss": 1.1017, "step": 8133 }, { "epoch": 0.25, "learning_rate": 4.417826040080467e-06, "loss": 1.0841, "step": 8134 }, { "epoch": 0.25, "learning_rate": 4.417669558394494e-06, "loss": 1.0522, "step": 8135 }, { "epoch": 0.25, "learning_rate": 4.417513058453229e-06, "loss": 1.1411, "step": 8136 }, { "epoch": 0.25, "learning_rate": 4.417356540258163e-06, "loss": 1.0753, "step": 8137 }, { "epoch": 0.25, "learning_rate": 4.417200003810787e-06, "loss": 1.0696, "step": 8138 }, { "epoch": 0.25, "learning_rate": 4.41704344911259e-06, "loss": 1.1808, "step": 8139 }, { "epoch": 0.25, "learning_rate": 4.416886876165062e-06, "loss": 1.1295, "step": 8140 }, { "epoch": 0.25, "learning_rate": 4.416730284969695e-06, "loss": 1.2097, "step": 8141 }, { "epoch": 0.25, "learning_rate": 4.416573675527979e-06, "loss": 1.1305, "step": 8142 }, { "epoch": 0.25, "learning_rate": 4.416417047841404e-06, "loss": 1.2, "step": 8143 }, { "epoch": 0.25, "learning_rate": 4.416260401911463e-06, "loss": 1.192, "step": 8144 }, { "epoch": 0.25, "learning_rate": 4.416103737739645e-06, "loss": 1.1106, "step": 8145 }, { "epoch": 0.25, "learning_rate": 4.4159470553274405e-06, "loss": 1.1282, "step": 8146 }, { "epoch": 0.25, "learning_rate": 4.4157903546763445e-06, "loss": 1.1246, "step": 8147 }, { "epoch": 0.25, "learning_rate": 4.415633635787848e-06, "loss": 1.2902, "step": 8148 }, { "epoch": 0.25, "learning_rate": 4.4154768986634396e-06, "loss": 1.1959, "step": 8149 }, { "epoch": 0.25, "learning_rate": 4.415320143304616e-06, "loss": 1.075, "step": 8150 }, { "epoch": 0.25, "learning_rate": 4.4151633697128656e-06, "loss": 1.2281, "step": 8151 }, { "epoch": 0.25, "learning_rate": 4.4150065778896824e-06, "loss": 1.036, "step": 8152 }, { "epoch": 0.25, "learning_rate": 4.41484976783656e-06, "loss": 1.0776, "step": 8153 }, { "epoch": 0.25, "learning_rate": 4.414692939554988e-06, "loss": 1.2093, "step": 8154 }, { "epoch": 0.25, "learning_rate": 4.4145360930464625e-06, "loss": 1.1767, "step": 8155 }, { "epoch": 0.25, "learning_rate": 4.414379228312476e-06, "loss": 1.2219, "step": 8156 }, { "epoch": 0.25, "learning_rate": 4.41422234535452e-06, "loss": 1.1959, "step": 8157 }, { "epoch": 0.25, "learning_rate": 4.41406544417409e-06, "loss": 1.161, "step": 8158 }, { "epoch": 0.25, "learning_rate": 4.413908524772679e-06, "loss": 1.1547, "step": 8159 }, { "epoch": 0.25, "learning_rate": 4.41375158715178e-06, "loss": 1.1699, "step": 8160 }, { "epoch": 0.25, "learning_rate": 4.413594631312888e-06, "loss": 1.1525, "step": 8161 }, { "epoch": 0.25, "learning_rate": 4.413437657257497e-06, "loss": 1.1572, "step": 8162 }, { "epoch": 0.25, "learning_rate": 4.413280664987101e-06, "loss": 1.0768, "step": 8163 }, { "epoch": 0.25, "learning_rate": 4.413123654503193e-06, "loss": 1.1473, "step": 8164 }, { "epoch": 0.25, "learning_rate": 4.412966625807271e-06, "loss": 1.1757, "step": 8165 }, { "epoch": 0.25, "learning_rate": 4.412809578900827e-06, "loss": 1.1992, "step": 8166 }, { "epoch": 0.25, "learning_rate": 4.412652513785358e-06, "loss": 1.203, "step": 8167 }, { "epoch": 0.25, "learning_rate": 4.412495430462358e-06, "loss": 1.1783, "step": 8168 }, { "epoch": 0.25, "learning_rate": 4.412338328933322e-06, "loss": 1.1821, "step": 8169 }, { "epoch": 0.25, "learning_rate": 4.412181209199746e-06, "loss": 1.1238, "step": 8170 }, { "epoch": 0.25, "learning_rate": 4.412024071263127e-06, "loss": 1.0764, "step": 8171 }, { "epoch": 0.25, "learning_rate": 4.411866915124959e-06, "loss": 1.1716, "step": 8172 }, { "epoch": 0.25, "learning_rate": 4.411709740786738e-06, "loss": 1.1074, "step": 8173 }, { "epoch": 0.25, "learning_rate": 4.4115525482499625e-06, "loss": 1.1932, "step": 8174 }, { "epoch": 0.25, "learning_rate": 4.411395337516126e-06, "loss": 1.1805, "step": 8175 }, { "epoch": 0.25, "learning_rate": 4.411238108586727e-06, "loss": 1.1371, "step": 8176 }, { "epoch": 0.25, "learning_rate": 4.411080861463262e-06, "loss": 1.2319, "step": 8177 }, { "epoch": 0.25, "learning_rate": 4.410923596147227e-06, "loss": 1.1094, "step": 8178 }, { "epoch": 0.25, "learning_rate": 4.41076631264012e-06, "loss": 1.1132, "step": 8179 }, { "epoch": 0.25, "learning_rate": 4.410609010943439e-06, "loss": 1.155, "step": 8180 }, { "epoch": 0.25, "learning_rate": 4.410451691058679e-06, "loss": 1.1743, "step": 8181 }, { "epoch": 0.25, "learning_rate": 4.410294352987339e-06, "loss": 1.0682, "step": 8182 }, { "epoch": 0.25, "learning_rate": 4.410136996730917e-06, "loss": 1.1361, "step": 8183 }, { "epoch": 0.25, "learning_rate": 4.409979622290911e-06, "loss": 1.136, "step": 8184 }, { "epoch": 0.25, "learning_rate": 4.409822229668819e-06, "loss": 1.1327, "step": 8185 }, { "epoch": 0.25, "learning_rate": 4.409664818866139e-06, "loss": 1.2369, "step": 8186 }, { "epoch": 0.25, "learning_rate": 4.40950738988437e-06, "loss": 1.1357, "step": 8187 }, { "epoch": 0.25, "learning_rate": 4.40934994272501e-06, "loss": 1.2925, "step": 8188 }, { "epoch": 0.25, "learning_rate": 4.409192477389558e-06, "loss": 1.2079, "step": 8189 }, { "epoch": 0.25, "learning_rate": 4.409034993879513e-06, "loss": 1.224, "step": 8190 }, { "epoch": 0.25, "learning_rate": 4.408877492196374e-06, "loss": 1.0992, "step": 8191 }, { "epoch": 0.25, "learning_rate": 4.40871997234164e-06, "loss": 1.1313, "step": 8192 }, { "epoch": 0.25, "learning_rate": 4.4085624343168135e-06, "loss": 1.2179, "step": 8193 }, { "epoch": 0.25, "learning_rate": 4.40840487812339e-06, "loss": 1.1684, "step": 8194 }, { "epoch": 0.25, "learning_rate": 4.408247303762872e-06, "loss": 1.1437, "step": 8195 }, { "epoch": 0.25, "learning_rate": 4.408089711236758e-06, "loss": 1.1318, "step": 8196 }, { "epoch": 0.25, "learning_rate": 4.4079321005465494e-06, "loss": 1.0892, "step": 8197 }, { "epoch": 0.25, "learning_rate": 4.407774471693747e-06, "loss": 1.2199, "step": 8198 }, { "epoch": 0.25, "learning_rate": 4.407616824679849e-06, "loss": 1.214, "step": 8199 }, { "epoch": 0.25, "learning_rate": 4.4074591595063575e-06, "loss": 1.2383, "step": 8200 }, { "epoch": 0.25, "learning_rate": 4.407301476174774e-06, "loss": 1.2753, "step": 8201 }, { "epoch": 0.25, "learning_rate": 4.4071437746866e-06, "loss": 1.1176, "step": 8202 }, { "epoch": 0.25, "learning_rate": 4.4069860550433345e-06, "loss": 1.2004, "step": 8203 }, { "epoch": 0.25, "learning_rate": 4.40682831724648e-06, "loss": 1.1729, "step": 8204 }, { "epoch": 0.25, "learning_rate": 4.406670561297539e-06, "loss": 1.1278, "step": 8205 }, { "epoch": 0.25, "learning_rate": 4.4065127871980126e-06, "loss": 1.3109, "step": 8206 }, { "epoch": 0.25, "learning_rate": 4.406354994949402e-06, "loss": 1.194, "step": 8207 }, { "epoch": 0.25, "learning_rate": 4.40619718455321e-06, "loss": 1.1125, "step": 8208 }, { "epoch": 0.25, "learning_rate": 4.406039356010939e-06, "loss": 1.1163, "step": 8209 }, { "epoch": 0.25, "learning_rate": 4.405881509324093e-06, "loss": 1.1642, "step": 8210 }, { "epoch": 0.25, "learning_rate": 4.405723644494171e-06, "loss": 1.297, "step": 8211 }, { "epoch": 0.25, "learning_rate": 4.405565761522677e-06, "loss": 1.0835, "step": 8212 }, { "epoch": 0.25, "learning_rate": 4.405407860411117e-06, "loss": 1.0989, "step": 8213 }, { "epoch": 0.25, "learning_rate": 4.405249941160991e-06, "loss": 1.1122, "step": 8214 }, { "epoch": 0.25, "learning_rate": 4.405092003773802e-06, "loss": 1.1249, "step": 8215 }, { "epoch": 0.25, "learning_rate": 4.404934048251056e-06, "loss": 1.0598, "step": 8216 }, { "epoch": 0.25, "learning_rate": 4.404776074594255e-06, "loss": 1.136, "step": 8217 }, { "epoch": 0.25, "learning_rate": 4.404618082804903e-06, "loss": 1.0652, "step": 8218 }, { "epoch": 0.25, "learning_rate": 4.404460072884505e-06, "loss": 1.097, "step": 8219 }, { "epoch": 0.25, "learning_rate": 4.404302044834563e-06, "loss": 1.1173, "step": 8220 }, { "epoch": 0.25, "learning_rate": 4.404143998656582e-06, "loss": 1.1498, "step": 8221 }, { "epoch": 0.25, "learning_rate": 4.403985934352069e-06, "loss": 1.2197, "step": 8222 }, { "epoch": 0.25, "learning_rate": 4.403827851922526e-06, "loss": 1.0848, "step": 8223 }, { "epoch": 0.25, "learning_rate": 4.40366975136946e-06, "loss": 1.1556, "step": 8224 }, { "epoch": 0.25, "learning_rate": 4.403511632694373e-06, "loss": 1.0685, "step": 8225 }, { "epoch": 0.25, "learning_rate": 4.4033534958987736e-06, "loss": 1.2018, "step": 8226 }, { "epoch": 0.25, "learning_rate": 4.403195340984164e-06, "loss": 1.1676, "step": 8227 }, { "epoch": 0.25, "learning_rate": 4.403037167952052e-06, "loss": 1.0922, "step": 8228 }, { "epoch": 0.25, "learning_rate": 4.402878976803943e-06, "loss": 1.2458, "step": 8229 }, { "epoch": 0.25, "learning_rate": 4.402720767541343e-06, "loss": 1.1539, "step": 8230 }, { "epoch": 0.25, "learning_rate": 4.402562540165757e-06, "loss": 1.1722, "step": 8231 }, { "epoch": 0.25, "learning_rate": 4.402404294678692e-06, "loss": 1.1423, "step": 8232 }, { "epoch": 0.25, "learning_rate": 4.402246031081655e-06, "loss": 1.0959, "step": 8233 }, { "epoch": 0.25, "learning_rate": 4.402087749376151e-06, "loss": 1.1115, "step": 8234 }, { "epoch": 0.25, "learning_rate": 4.4019294495636874e-06, "loss": 1.0684, "step": 8235 }, { "epoch": 0.25, "learning_rate": 4.401771131645773e-06, "loss": 1.1495, "step": 8236 }, { "epoch": 0.25, "learning_rate": 4.401612795623912e-06, "loss": 1.2072, "step": 8237 }, { "epoch": 0.25, "learning_rate": 4.401454441499614e-06, "loss": 1.2517, "step": 8238 }, { "epoch": 0.25, "learning_rate": 4.401296069274384e-06, "loss": 1.1802, "step": 8239 }, { "epoch": 0.25, "learning_rate": 4.401137678949733e-06, "loss": 1.1091, "step": 8240 }, { "epoch": 0.25, "learning_rate": 4.400979270527166e-06, "loss": 1.076, "step": 8241 }, { "epoch": 0.25, "learning_rate": 4.400820844008192e-06, "loss": 1.1211, "step": 8242 }, { "epoch": 0.25, "learning_rate": 4.400662399394319e-06, "loss": 1.1066, "step": 8243 }, { "epoch": 0.25, "learning_rate": 4.400503936687055e-06, "loss": 1.1049, "step": 8244 }, { "epoch": 0.25, "learning_rate": 4.400345455887909e-06, "loss": 1.0903, "step": 8245 }, { "epoch": 0.25, "learning_rate": 4.4001869569983905e-06, "loss": 1.1213, "step": 8246 }, { "epoch": 0.25, "learning_rate": 4.400028440020006e-06, "loss": 1.2258, "step": 8247 }, { "epoch": 0.25, "learning_rate": 4.399869904954266e-06, "loss": 1.1556, "step": 8248 }, { "epoch": 0.25, "learning_rate": 4.39971135180268e-06, "loss": 1.1173, "step": 8249 }, { "epoch": 0.25, "learning_rate": 4.399552780566757e-06, "loss": 1.1046, "step": 8250 }, { "epoch": 0.25, "learning_rate": 4.399394191248006e-06, "loss": 1.1777, "step": 8251 }, { "epoch": 0.25, "learning_rate": 4.399235583847937e-06, "loss": 1.1523, "step": 8252 }, { "epoch": 0.25, "learning_rate": 4.39907695836806e-06, "loss": 1.0712, "step": 8253 }, { "epoch": 0.25, "learning_rate": 4.398918314809885e-06, "loss": 1.176, "step": 8254 }, { "epoch": 0.25, "learning_rate": 4.398759653174922e-06, "loss": 1.2841, "step": 8255 }, { "epoch": 0.25, "learning_rate": 4.398600973464682e-06, "loss": 1.2221, "step": 8256 }, { "epoch": 0.25, "learning_rate": 4.398442275680675e-06, "loss": 1.1462, "step": 8257 }, { "epoch": 0.25, "learning_rate": 4.398283559824412e-06, "loss": 1.1848, "step": 8258 }, { "epoch": 0.25, "learning_rate": 4.3981248258974035e-06, "loss": 1.1458, "step": 8259 }, { "epoch": 0.25, "learning_rate": 4.397966073901161e-06, "loss": 1.1316, "step": 8260 }, { "epoch": 0.25, "learning_rate": 4.397807303837195e-06, "loss": 1.2596, "step": 8261 }, { "epoch": 0.25, "learning_rate": 4.397648515707018e-06, "loss": 1.2756, "step": 8262 }, { "epoch": 0.25, "learning_rate": 4.397489709512141e-06, "loss": 1.1971, "step": 8263 }, { "epoch": 0.25, "learning_rate": 4.397330885254076e-06, "loss": 1.1833, "step": 8264 }, { "epoch": 0.25, "learning_rate": 4.397172042934335e-06, "loss": 1.1823, "step": 8265 }, { "epoch": 0.25, "learning_rate": 4.397013182554429e-06, "loss": 0.9354, "step": 8266 }, { "epoch": 0.25, "learning_rate": 4.396854304115872e-06, "loss": 1.1107, "step": 8267 }, { "epoch": 0.25, "learning_rate": 4.396695407620175e-06, "loss": 1.0929, "step": 8268 }, { "epoch": 0.25, "learning_rate": 4.396536493068851e-06, "loss": 1.1894, "step": 8269 }, { "epoch": 0.25, "learning_rate": 4.396377560463414e-06, "loss": 1.1398, "step": 8270 }, { "epoch": 0.25, "learning_rate": 4.3962186098053754e-06, "loss": 1.181, "step": 8271 }, { "epoch": 0.25, "learning_rate": 4.396059641096249e-06, "loss": 1.1603, "step": 8272 }, { "epoch": 0.25, "learning_rate": 4.3959006543375475e-06, "loss": 1.2336, "step": 8273 }, { "epoch": 0.25, "learning_rate": 4.3957416495307855e-06, "loss": 1.1469, "step": 8274 }, { "epoch": 0.25, "learning_rate": 4.395582626677476e-06, "loss": 1.1716, "step": 8275 }, { "epoch": 0.25, "learning_rate": 4.395423585779132e-06, "loss": 1.1467, "step": 8276 }, { "epoch": 0.25, "learning_rate": 4.395264526837269e-06, "loss": 1.2175, "step": 8277 }, { "epoch": 0.25, "learning_rate": 4.3951054498534e-06, "loss": 1.0297, "step": 8278 }, { "epoch": 0.25, "learning_rate": 4.3949463548290406e-06, "loss": 1.0987, "step": 8279 }, { "epoch": 0.25, "learning_rate": 4.394787241765705e-06, "loss": 1.2748, "step": 8280 }, { "epoch": 0.25, "learning_rate": 4.3946281106649055e-06, "loss": 1.2102, "step": 8281 }, { "epoch": 0.25, "learning_rate": 4.39446896152816e-06, "loss": 1.1979, "step": 8282 }, { "epoch": 0.25, "learning_rate": 4.394309794356982e-06, "loss": 1.2145, "step": 8283 }, { "epoch": 0.25, "learning_rate": 4.394150609152887e-06, "loss": 1.0607, "step": 8284 }, { "epoch": 0.25, "learning_rate": 4.3939914059173916e-06, "loss": 1.1996, "step": 8285 }, { "epoch": 0.25, "learning_rate": 4.39383218465201e-06, "loss": 1.1971, "step": 8286 }, { "epoch": 0.25, "learning_rate": 4.393672945358257e-06, "loss": 1.0679, "step": 8287 }, { "epoch": 0.25, "learning_rate": 4.393513688037651e-06, "loss": 1.0744, "step": 8288 }, { "epoch": 0.25, "learning_rate": 4.393354412691705e-06, "loss": 1.0529, "step": 8289 }, { "epoch": 0.25, "learning_rate": 4.393195119321937e-06, "loss": 1.0687, "step": 8290 }, { "epoch": 0.25, "learning_rate": 4.393035807929864e-06, "loss": 1.1592, "step": 8291 }, { "epoch": 0.25, "learning_rate": 4.392876478517002e-06, "loss": 1.236, "step": 8292 }, { "epoch": 0.25, "learning_rate": 4.3927171310848675e-06, "loss": 1.1788, "step": 8293 }, { "epoch": 0.25, "learning_rate": 4.3925577656349775e-06, "loss": 1.1663, "step": 8294 }, { "epoch": 0.25, "learning_rate": 4.392398382168848e-06, "loss": 1.0737, "step": 8295 }, { "epoch": 0.25, "learning_rate": 4.392238980687999e-06, "loss": 1.1094, "step": 8296 }, { "epoch": 0.25, "learning_rate": 4.392079561193945e-06, "loss": 1.2108, "step": 8297 }, { "epoch": 0.25, "learning_rate": 4.3919201236882055e-06, "loss": 1.1069, "step": 8298 }, { "epoch": 0.25, "learning_rate": 4.391760668172297e-06, "loss": 1.1036, "step": 8299 }, { "epoch": 0.25, "learning_rate": 4.391601194647738e-06, "loss": 1.0792, "step": 8300 }, { "epoch": 0.25, "learning_rate": 4.391441703116047e-06, "loss": 1.1243, "step": 8301 }, { "epoch": 0.25, "learning_rate": 4.391282193578743e-06, "loss": 1.1033, "step": 8302 }, { "epoch": 0.25, "learning_rate": 4.3911226660373415e-06, "loss": 1.1099, "step": 8303 }, { "epoch": 0.25, "learning_rate": 4.390963120493364e-06, "loss": 1.1313, "step": 8304 }, { "epoch": 0.25, "learning_rate": 4.390803556948328e-06, "loss": 1.1547, "step": 8305 }, { "epoch": 0.25, "learning_rate": 4.390643975403753e-06, "loss": 1.1194, "step": 8306 }, { "epoch": 0.25, "learning_rate": 4.390484375861158e-06, "loss": 1.1954, "step": 8307 }, { "epoch": 0.25, "learning_rate": 4.390324758322062e-06, "loss": 1.1984, "step": 8308 }, { "epoch": 0.25, "learning_rate": 4.390165122787985e-06, "loss": 1.1837, "step": 8309 }, { "epoch": 0.25, "learning_rate": 4.390005469260446e-06, "loss": 1.0678, "step": 8310 }, { "epoch": 0.25, "learning_rate": 4.389845797740966e-06, "loss": 1.2194, "step": 8311 }, { "epoch": 0.25, "learning_rate": 4.389686108231063e-06, "loss": 1.0826, "step": 8312 }, { "epoch": 0.25, "learning_rate": 4.389526400732259e-06, "loss": 1.1927, "step": 8313 }, { "epoch": 0.25, "learning_rate": 4.3893666752460734e-06, "loss": 1.1677, "step": 8314 }, { "epoch": 0.25, "learning_rate": 4.389206931774027e-06, "loss": 1.1147, "step": 8315 }, { "epoch": 0.25, "learning_rate": 4.38904717031764e-06, "loss": 1.118, "step": 8316 }, { "epoch": 0.25, "learning_rate": 4.388887390878435e-06, "loss": 1.0942, "step": 8317 }, { "epoch": 0.25, "learning_rate": 4.388727593457932e-06, "loss": 1.1287, "step": 8318 }, { "epoch": 0.25, "learning_rate": 4.388567778057651e-06, "loss": 1.0519, "step": 8319 }, { "epoch": 0.25, "learning_rate": 4.388407944679114e-06, "loss": 1.1226, "step": 8320 }, { "epoch": 0.25, "learning_rate": 4.388248093323843e-06, "loss": 1.0549, "step": 8321 }, { "epoch": 0.25, "learning_rate": 4.38808822399336e-06, "loss": 1.2006, "step": 8322 }, { "epoch": 0.25, "learning_rate": 4.387928336689187e-06, "loss": 1.2427, "step": 8323 }, { "epoch": 0.25, "learning_rate": 4.387768431412844e-06, "loss": 1.245, "step": 8324 }, { "epoch": 0.25, "learning_rate": 4.387608508165856e-06, "loss": 1.1844, "step": 8325 }, { "epoch": 0.25, "learning_rate": 4.387448566949743e-06, "loss": 1.1163, "step": 8326 }, { "epoch": 0.25, "learning_rate": 4.38728860776603e-06, "loss": 1.0634, "step": 8327 }, { "epoch": 0.25, "learning_rate": 4.387128630616237e-06, "loss": 1.1695, "step": 8328 }, { "epoch": 0.25, "learning_rate": 4.386968635501889e-06, "loss": 0.9815, "step": 8329 }, { "epoch": 0.25, "learning_rate": 4.386808622424509e-06, "loss": 1.1938, "step": 8330 }, { "epoch": 0.25, "learning_rate": 4.386648591385618e-06, "loss": 1.2159, "step": 8331 }, { "epoch": 0.25, "learning_rate": 4.386488542386743e-06, "loss": 1.0863, "step": 8332 }, { "epoch": 0.25, "learning_rate": 4.386328475429404e-06, "loss": 1.1335, "step": 8333 }, { "epoch": 0.25, "learning_rate": 4.386168390515128e-06, "loss": 1.1245, "step": 8334 }, { "epoch": 0.25, "learning_rate": 4.386008287645436e-06, "loss": 1.058, "step": 8335 }, { "epoch": 0.25, "learning_rate": 4.385848166821854e-06, "loss": 1.2276, "step": 8336 }, { "epoch": 0.25, "learning_rate": 4.385688028045905e-06, "loss": 1.1882, "step": 8337 }, { "epoch": 0.25, "learning_rate": 4.385527871319115e-06, "loss": 1.1602, "step": 8338 }, { "epoch": 0.25, "learning_rate": 4.385367696643007e-06, "loss": 1.1572, "step": 8339 }, { "epoch": 0.25, "learning_rate": 4.3852075040191074e-06, "loss": 1.1541, "step": 8340 }, { "epoch": 0.25, "learning_rate": 4.38504729344894e-06, "loss": 1.0852, "step": 8341 }, { "epoch": 0.25, "learning_rate": 4.384887064934031e-06, "loss": 1.1919, "step": 8342 }, { "epoch": 0.25, "learning_rate": 4.384726818475904e-06, "loss": 1.0302, "step": 8343 }, { "epoch": 0.25, "learning_rate": 4.3845665540760855e-06, "loss": 1.2772, "step": 8344 }, { "epoch": 0.25, "learning_rate": 4.3844062717361e-06, "loss": 1.1672, "step": 8345 }, { "epoch": 0.25, "learning_rate": 4.384245971457476e-06, "loss": 1.1431, "step": 8346 }, { "epoch": 0.25, "learning_rate": 4.384085653241738e-06, "loss": 1.0562, "step": 8347 }, { "epoch": 0.25, "learning_rate": 4.3839253170904105e-06, "loss": 1.1362, "step": 8348 }, { "epoch": 0.25, "learning_rate": 4.383764963005022e-06, "loss": 1.1975, "step": 8349 }, { "epoch": 0.25, "learning_rate": 4.383604590987098e-06, "loss": 1.2782, "step": 8350 }, { "epoch": 0.25, "learning_rate": 4.3834442010381664e-06, "loss": 1.1122, "step": 8351 }, { "epoch": 0.25, "learning_rate": 4.383283793159753e-06, "loss": 1.1748, "step": 8352 }, { "epoch": 0.25, "learning_rate": 4.383123367353383e-06, "loss": 1.0625, "step": 8353 }, { "epoch": 0.25, "learning_rate": 4.382962923620588e-06, "loss": 1.223, "step": 8354 }, { "epoch": 0.25, "learning_rate": 4.382802461962892e-06, "loss": 1.2175, "step": 8355 }, { "epoch": 0.25, "learning_rate": 4.382641982381823e-06, "loss": 1.056, "step": 8356 }, { "epoch": 0.25, "learning_rate": 4.382481484878909e-06, "loss": 1.1315, "step": 8357 }, { "epoch": 0.25, "learning_rate": 4.382320969455678e-06, "loss": 1.1564, "step": 8358 }, { "epoch": 0.25, "learning_rate": 4.3821604361136585e-06, "loss": 1.2266, "step": 8359 }, { "epoch": 0.25, "learning_rate": 4.381999884854377e-06, "loss": 1.1231, "step": 8360 }, { "epoch": 0.25, "learning_rate": 4.381839315679363e-06, "loss": 1.1801, "step": 8361 }, { "epoch": 0.25, "learning_rate": 4.381678728590146e-06, "loss": 1.3735, "step": 8362 }, { "epoch": 0.25, "learning_rate": 4.381518123588254e-06, "loss": 1.0889, "step": 8363 }, { "epoch": 0.25, "learning_rate": 4.381357500675215e-06, "loss": 1.1374, "step": 8364 }, { "epoch": 0.25, "learning_rate": 4.381196859852558e-06, "loss": 1.0287, "step": 8365 }, { "epoch": 0.25, "learning_rate": 4.381036201121814e-06, "loss": 1.1891, "step": 8366 }, { "epoch": 0.25, "learning_rate": 4.380875524484511e-06, "loss": 1.193, "step": 8367 }, { "epoch": 0.25, "learning_rate": 4.380714829942179e-06, "loss": 1.116, "step": 8368 }, { "epoch": 0.25, "learning_rate": 4.380554117496347e-06, "loss": 1.1842, "step": 8369 }, { "epoch": 0.25, "learning_rate": 4.380393387148546e-06, "loss": 1.1441, "step": 8370 }, { "epoch": 0.25, "learning_rate": 4.380232638900305e-06, "loss": 1.0868, "step": 8371 }, { "epoch": 0.25, "learning_rate": 4.380071872753156e-06, "loss": 1.184, "step": 8372 }, { "epoch": 0.25, "learning_rate": 4.3799110887086275e-06, "loss": 1.1326, "step": 8373 }, { "epoch": 0.25, "learning_rate": 4.379750286768251e-06, "loss": 1.1014, "step": 8374 }, { "epoch": 0.25, "learning_rate": 4.3795894669335574e-06, "loss": 1.2012, "step": 8375 }, { "epoch": 0.25, "learning_rate": 4.379428629206076e-06, "loss": 1.1921, "step": 8376 }, { "epoch": 0.25, "learning_rate": 4.379267773587341e-06, "loss": 1.1052, "step": 8377 }, { "epoch": 0.25, "learning_rate": 4.37910690007888e-06, "loss": 1.1567, "step": 8378 }, { "epoch": 0.25, "learning_rate": 4.378946008682228e-06, "loss": 1.1076, "step": 8379 }, { "epoch": 0.25, "learning_rate": 4.378785099398914e-06, "loss": 1.1619, "step": 8380 }, { "epoch": 0.25, "learning_rate": 4.378624172230471e-06, "loss": 1.0612, "step": 8381 }, { "epoch": 0.25, "learning_rate": 4.37846322717843e-06, "loss": 1.0595, "step": 8382 }, { "epoch": 0.25, "learning_rate": 4.378302264244325e-06, "loss": 1.1305, "step": 8383 }, { "epoch": 0.25, "learning_rate": 4.378141283429687e-06, "loss": 1.0624, "step": 8384 }, { "epoch": 0.25, "learning_rate": 4.377980284736047e-06, "loss": 1.0109, "step": 8385 }, { "epoch": 0.25, "learning_rate": 4.377819268164941e-06, "loss": 1.2209, "step": 8386 }, { "epoch": 0.25, "learning_rate": 4.3776582337178986e-06, "loss": 1.1983, "step": 8387 }, { "epoch": 0.25, "learning_rate": 4.377497181396455e-06, "loss": 1.2102, "step": 8388 }, { "epoch": 0.25, "learning_rate": 4.377336111202142e-06, "loss": 1.324, "step": 8389 }, { "epoch": 0.25, "learning_rate": 4.377175023136493e-06, "loss": 1.1224, "step": 8390 }, { "epoch": 0.25, "learning_rate": 4.377013917201043e-06, "loss": 1.1688, "step": 8391 }, { "epoch": 0.25, "learning_rate": 4.376852793397323e-06, "loss": 1.2631, "step": 8392 }, { "epoch": 0.25, "learning_rate": 4.37669165172687e-06, "loss": 1.1136, "step": 8393 }, { "epoch": 0.25, "learning_rate": 4.376530492191215e-06, "loss": 1.0816, "step": 8394 }, { "epoch": 0.25, "learning_rate": 4.376369314791894e-06, "loss": 1.2293, "step": 8395 }, { "epoch": 0.25, "learning_rate": 4.376208119530441e-06, "loss": 1.0955, "step": 8396 }, { "epoch": 0.25, "learning_rate": 4.37604690640839e-06, "loss": 1.2368, "step": 8397 }, { "epoch": 0.25, "learning_rate": 4.375885675427276e-06, "loss": 1.1514, "step": 8398 }, { "epoch": 0.25, "learning_rate": 4.375724426588634e-06, "loss": 1.0447, "step": 8399 }, { "epoch": 0.25, "learning_rate": 4.375563159893998e-06, "loss": 1.1806, "step": 8400 }, { "epoch": 0.25, "learning_rate": 4.375401875344906e-06, "loss": 1.0816, "step": 8401 }, { "epoch": 0.25, "learning_rate": 4.375240572942889e-06, "loss": 1.0107, "step": 8402 }, { "epoch": 0.25, "learning_rate": 4.375079252689487e-06, "loss": 1.1613, "step": 8403 }, { "epoch": 0.25, "learning_rate": 4.374917914586232e-06, "loss": 1.2576, "step": 8404 }, { "epoch": 0.25, "learning_rate": 4.374756558634662e-06, "loss": 1.2253, "step": 8405 }, { "epoch": 0.25, "learning_rate": 4.374595184836313e-06, "loss": 1.2324, "step": 8406 }, { "epoch": 0.25, "learning_rate": 4.3744337931927196e-06, "loss": 1.1229, "step": 8407 }, { "epoch": 0.25, "learning_rate": 4.37427238370542e-06, "loss": 1.1209, "step": 8408 }, { "epoch": 0.25, "learning_rate": 4.37411095637595e-06, "loss": 1.0104, "step": 8409 }, { "epoch": 0.25, "learning_rate": 4.373949511205846e-06, "loss": 1.0221, "step": 8410 }, { "epoch": 0.25, "learning_rate": 4.373788048196646e-06, "loss": 1.1542, "step": 8411 }, { "epoch": 0.25, "learning_rate": 4.373626567349885e-06, "loss": 1.1966, "step": 8412 }, { "epoch": 0.25, "learning_rate": 4.3734650686671025e-06, "loss": 1.2164, "step": 8413 }, { "epoch": 0.25, "learning_rate": 4.373303552149834e-06, "loss": 1.1433, "step": 8414 }, { "epoch": 0.25, "learning_rate": 4.373142017799618e-06, "loss": 1.0576, "step": 8415 }, { "epoch": 0.25, "learning_rate": 4.372980465617993e-06, "loss": 1.064, "step": 8416 }, { "epoch": 0.25, "learning_rate": 4.3728188956064946e-06, "loss": 1.1223, "step": 8417 }, { "epoch": 0.25, "learning_rate": 4.372657307766664e-06, "loss": 1.1879, "step": 8418 }, { "epoch": 0.25, "learning_rate": 4.372495702100036e-06, "loss": 1.0358, "step": 8419 }, { "epoch": 0.25, "learning_rate": 4.372334078608152e-06, "loss": 1.0302, "step": 8420 }, { "epoch": 0.25, "learning_rate": 4.372172437292548e-06, "loss": 1.1104, "step": 8421 }, { "epoch": 0.25, "learning_rate": 4.372010778154765e-06, "loss": 1.0306, "step": 8422 }, { "epoch": 0.25, "learning_rate": 4.371849101196342e-06, "loss": 1.0065, "step": 8423 }, { "epoch": 0.25, "learning_rate": 4.371687406418815e-06, "loss": 1.2729, "step": 8424 }, { "epoch": 0.25, "learning_rate": 4.371525693823727e-06, "loss": 1.1101, "step": 8425 }, { "epoch": 0.25, "learning_rate": 4.371363963412615e-06, "loss": 1.2424, "step": 8426 }, { "epoch": 0.25, "learning_rate": 4.37120221518702e-06, "loss": 1.068, "step": 8427 }, { "epoch": 0.25, "learning_rate": 4.37104044914848e-06, "loss": 0.9944, "step": 8428 }, { "epoch": 0.25, "learning_rate": 4.370878665298537e-06, "loss": 1.111, "step": 8429 }, { "epoch": 0.25, "learning_rate": 4.370716863638729e-06, "loss": 1.0964, "step": 8430 }, { "epoch": 0.25, "learning_rate": 4.370555044170598e-06, "loss": 1.2555, "step": 8431 }, { "epoch": 0.25, "learning_rate": 4.370393206895685e-06, "loss": 1.1248, "step": 8432 }, { "epoch": 0.25, "learning_rate": 4.370231351815528e-06, "loss": 1.1984, "step": 8433 }, { "epoch": 0.25, "learning_rate": 4.37006947893167e-06, "loss": 1.157, "step": 8434 }, { "epoch": 0.25, "learning_rate": 4.36990758824565e-06, "loss": 1.1218, "step": 8435 }, { "epoch": 0.25, "learning_rate": 4.369745679759012e-06, "loss": 1.1957, "step": 8436 }, { "epoch": 0.25, "learning_rate": 4.369583753473295e-06, "loss": 1.0629, "step": 8437 }, { "epoch": 0.25, "learning_rate": 4.369421809390041e-06, "loss": 1.0469, "step": 8438 }, { "epoch": 0.25, "learning_rate": 4.369259847510792e-06, "loss": 1.1277, "step": 8439 }, { "epoch": 0.25, "learning_rate": 4.369097867837089e-06, "loss": 1.2682, "step": 8440 }, { "epoch": 0.25, "learning_rate": 4.368935870370474e-06, "loss": 1.1379, "step": 8441 }, { "epoch": 0.25, "learning_rate": 4.368773855112491e-06, "loss": 1.1389, "step": 8442 }, { "epoch": 0.25, "learning_rate": 4.368611822064681e-06, "loss": 1.1215, "step": 8443 }, { "epoch": 0.25, "learning_rate": 4.368449771228586e-06, "loss": 1.0118, "step": 8444 }, { "epoch": 0.25, "learning_rate": 4.368287702605748e-06, "loss": 1.0916, "step": 8445 }, { "epoch": 0.25, "learning_rate": 4.368125616197711e-06, "loss": 1.1186, "step": 8446 }, { "epoch": 0.25, "learning_rate": 4.367963512006019e-06, "loss": 1.0862, "step": 8447 }, { "epoch": 0.25, "learning_rate": 4.367801390032214e-06, "loss": 1.196, "step": 8448 }, { "epoch": 0.25, "learning_rate": 4.367639250277839e-06, "loss": 1.0728, "step": 8449 }, { "epoch": 0.25, "learning_rate": 4.367477092744437e-06, "loss": 1.134, "step": 8450 }, { "epoch": 0.25, "learning_rate": 4.367314917433553e-06, "loss": 1.2246, "step": 8451 }, { "epoch": 0.25, "learning_rate": 4.367152724346731e-06, "loss": 1.1265, "step": 8452 }, { "epoch": 0.25, "learning_rate": 4.366990513485514e-06, "loss": 1.087, "step": 8453 }, { "epoch": 0.25, "learning_rate": 4.366828284851446e-06, "loss": 1.0467, "step": 8454 }, { "epoch": 0.25, "learning_rate": 4.366666038446072e-06, "loss": 1.1937, "step": 8455 }, { "epoch": 0.25, "learning_rate": 4.366503774270936e-06, "loss": 1.1879, "step": 8456 }, { "epoch": 0.25, "learning_rate": 4.366341492327583e-06, "loss": 1.1787, "step": 8457 }, { "epoch": 0.25, "learning_rate": 4.366179192617559e-06, "loss": 1.0673, "step": 8458 }, { "epoch": 0.25, "learning_rate": 4.366016875142407e-06, "loss": 1.0529, "step": 8459 }, { "epoch": 0.25, "learning_rate": 4.3658545399036736e-06, "loss": 1.1212, "step": 8460 }, { "epoch": 0.25, "learning_rate": 4.365692186902903e-06, "loss": 1.1178, "step": 8461 }, { "epoch": 0.25, "learning_rate": 4.365529816141641e-06, "loss": 1.2444, "step": 8462 }, { "epoch": 0.25, "learning_rate": 4.3653674276214345e-06, "loss": 1.1427, "step": 8463 }, { "epoch": 0.25, "learning_rate": 4.365205021343828e-06, "loss": 1.123, "step": 8464 }, { "epoch": 0.26, "learning_rate": 4.365042597310369e-06, "loss": 1.0818, "step": 8465 }, { "epoch": 0.26, "learning_rate": 4.364880155522602e-06, "loss": 1.1734, "step": 8466 }, { "epoch": 0.26, "learning_rate": 4.364717695982074e-06, "loss": 1.0246, "step": 8467 }, { "epoch": 0.26, "learning_rate": 4.3645552186903315e-06, "loss": 1.2101, "step": 8468 }, { "epoch": 0.26, "learning_rate": 4.3643927236489205e-06, "loss": 1.1708, "step": 8469 }, { "epoch": 0.26, "learning_rate": 4.36423021085939e-06, "loss": 1.1611, "step": 8470 }, { "epoch": 0.26, "learning_rate": 4.364067680323285e-06, "loss": 1.0931, "step": 8471 }, { "epoch": 0.26, "learning_rate": 4.3639051320421545e-06, "loss": 1.0276, "step": 8472 }, { "epoch": 0.26, "learning_rate": 4.363742566017544e-06, "loss": 1.1018, "step": 8473 }, { "epoch": 0.26, "learning_rate": 4.363579982251002e-06, "loss": 1.1649, "step": 8474 }, { "epoch": 0.26, "learning_rate": 4.3634173807440765e-06, "loss": 1.2365, "step": 8475 }, { "epoch": 0.26, "learning_rate": 4.363254761498314e-06, "loss": 1.169, "step": 8476 }, { "epoch": 0.26, "learning_rate": 4.363092124515263e-06, "loss": 1.084, "step": 8477 }, { "epoch": 0.26, "learning_rate": 4.362929469796474e-06, "loss": 0.9954, "step": 8478 }, { "epoch": 0.26, "learning_rate": 4.362766797343494e-06, "loss": 1.173, "step": 8479 }, { "epoch": 0.26, "learning_rate": 4.362604107157869e-06, "loss": 1.2011, "step": 8480 }, { "epoch": 0.26, "learning_rate": 4.362441399241152e-06, "loss": 1.1934, "step": 8481 }, { "epoch": 0.26, "learning_rate": 4.362278673594889e-06, "loss": 1.2234, "step": 8482 }, { "epoch": 0.26, "learning_rate": 4.36211593022063e-06, "loss": 0.9951, "step": 8483 }, { "epoch": 0.26, "learning_rate": 4.361953169119924e-06, "loss": 1.1299, "step": 8484 }, { "epoch": 0.26, "learning_rate": 4.361790390294321e-06, "loss": 1.1658, "step": 8485 }, { "epoch": 0.26, "learning_rate": 4.36162759374537e-06, "loss": 1.3094, "step": 8486 }, { "epoch": 0.26, "learning_rate": 4.36146477947462e-06, "loss": 1.2307, "step": 8487 }, { "epoch": 0.26, "learning_rate": 4.361301947483623e-06, "loss": 1.0757, "step": 8488 }, { "epoch": 0.26, "learning_rate": 4.3611390977739275e-06, "loss": 1.2039, "step": 8489 }, { "epoch": 0.26, "learning_rate": 4.360976230347085e-06, "loss": 1.0854, "step": 8490 }, { "epoch": 0.26, "learning_rate": 4.3608133452046434e-06, "loss": 1.1748, "step": 8491 }, { "epoch": 0.26, "learning_rate": 4.360650442348156e-06, "loss": 1.2341, "step": 8492 }, { "epoch": 0.26, "learning_rate": 4.360487521779173e-06, "loss": 1.0883, "step": 8493 }, { "epoch": 0.26, "learning_rate": 4.360324583499243e-06, "loss": 1.0439, "step": 8494 }, { "epoch": 0.26, "learning_rate": 4.360161627509921e-06, "loss": 1.0557, "step": 8495 }, { "epoch": 0.26, "learning_rate": 4.359998653812755e-06, "loss": 1.0796, "step": 8496 }, { "epoch": 0.26, "learning_rate": 4.3598356624092975e-06, "loss": 1.1603, "step": 8497 }, { "epoch": 0.26, "learning_rate": 4.3596726533011005e-06, "loss": 1.2026, "step": 8498 }, { "epoch": 0.26, "learning_rate": 4.359509626489716e-06, "loss": 1.1816, "step": 8499 }, { "epoch": 0.26, "learning_rate": 4.3593465819766944e-06, "loss": 1.1661, "step": 8500 }, { "epoch": 0.26, "learning_rate": 4.35918351976359e-06, "loss": 1.0668, "step": 8501 }, { "epoch": 0.26, "learning_rate": 4.359020439851953e-06, "loss": 1.1362, "step": 8502 }, { "epoch": 0.26, "learning_rate": 4.358857342243337e-06, "loss": 1.0624, "step": 8503 }, { "epoch": 0.26, "learning_rate": 4.3586942269392955e-06, "loss": 1.1605, "step": 8504 }, { "epoch": 0.26, "learning_rate": 4.358531093941378e-06, "loss": 1.2486, "step": 8505 }, { "epoch": 0.26, "learning_rate": 4.358367943251141e-06, "loss": 1.1594, "step": 8506 }, { "epoch": 0.26, "learning_rate": 4.358204774870136e-06, "loss": 1.1587, "step": 8507 }, { "epoch": 0.26, "learning_rate": 4.358041588799916e-06, "loss": 1.1262, "step": 8508 }, { "epoch": 0.26, "learning_rate": 4.357878385042036e-06, "loss": 1.1638, "step": 8509 }, { "epoch": 0.26, "learning_rate": 4.3577151635980475e-06, "loss": 1.1164, "step": 8510 }, { "epoch": 0.26, "learning_rate": 4.357551924469505e-06, "loss": 1.0367, "step": 8511 }, { "epoch": 0.26, "learning_rate": 4.357388667657964e-06, "loss": 1.2826, "step": 8512 }, { "epoch": 0.26, "learning_rate": 4.357225393164977e-06, "loss": 1.101, "step": 8513 }, { "epoch": 0.26, "learning_rate": 4.357062100992099e-06, "loss": 1.1979, "step": 8514 }, { "epoch": 0.26, "learning_rate": 4.356898791140884e-06, "loss": 1.1063, "step": 8515 }, { "epoch": 0.26, "learning_rate": 4.3567354636128865e-06, "loss": 1.1498, "step": 8516 }, { "epoch": 0.26, "learning_rate": 4.356572118409661e-06, "loss": 1.209, "step": 8517 }, { "epoch": 0.26, "learning_rate": 4.356408755532764e-06, "loss": 1.2142, "step": 8518 }, { "epoch": 0.26, "learning_rate": 4.35624537498375e-06, "loss": 1.0558, "step": 8519 }, { "epoch": 0.26, "learning_rate": 4.356081976764174e-06, "loss": 1.0837, "step": 8520 }, { "epoch": 0.26, "learning_rate": 4.355918560875591e-06, "loss": 1.1962, "step": 8521 }, { "epoch": 0.26, "learning_rate": 4.355755127319558e-06, "loss": 1.2678, "step": 8522 }, { "epoch": 0.26, "learning_rate": 4.355591676097628e-06, "loss": 1.1816, "step": 8523 }, { "epoch": 0.26, "learning_rate": 4.35542820721136e-06, "loss": 1.2585, "step": 8524 }, { "epoch": 0.26, "learning_rate": 4.35526472066231e-06, "loss": 1.2616, "step": 8525 }, { "epoch": 0.26, "learning_rate": 4.355101216452032e-06, "loss": 1.0997, "step": 8526 }, { "epoch": 0.26, "learning_rate": 4.3549376945820854e-06, "loss": 1.1052, "step": 8527 }, { "epoch": 0.26, "learning_rate": 4.354774155054024e-06, "loss": 1.1348, "step": 8528 }, { "epoch": 0.26, "learning_rate": 4.3546105978694065e-06, "loss": 1.1252, "step": 8529 }, { "epoch": 0.26, "learning_rate": 4.354447023029789e-06, "loss": 1.1876, "step": 8530 }, { "epoch": 0.26, "learning_rate": 4.3542834305367286e-06, "loss": 1.201, "step": 8531 }, { "epoch": 0.26, "learning_rate": 4.354119820391785e-06, "loss": 1.1351, "step": 8532 }, { "epoch": 0.26, "learning_rate": 4.353956192596512e-06, "loss": 1.0948, "step": 8533 }, { "epoch": 0.26, "learning_rate": 4.353792547152469e-06, "loss": 1.0851, "step": 8534 }, { "epoch": 0.26, "learning_rate": 4.353628884061214e-06, "loss": 1.2224, "step": 8535 }, { "epoch": 0.26, "learning_rate": 4.353465203324304e-06, "loss": 1.0375, "step": 8536 }, { "epoch": 0.26, "learning_rate": 4.353301504943299e-06, "loss": 1.0744, "step": 8537 }, { "epoch": 0.26, "learning_rate": 4.353137788919756e-06, "loss": 1.118, "step": 8538 }, { "epoch": 0.26, "learning_rate": 4.352974055255233e-06, "loss": 1.1786, "step": 8539 }, { "epoch": 0.26, "learning_rate": 4.352810303951291e-06, "loss": 1.2108, "step": 8540 }, { "epoch": 0.26, "learning_rate": 4.3526465350094855e-06, "loss": 1.0214, "step": 8541 }, { "epoch": 0.26, "learning_rate": 4.352482748431378e-06, "loss": 1.1922, "step": 8542 }, { "epoch": 0.26, "learning_rate": 4.352318944218527e-06, "loss": 1.2457, "step": 8543 }, { "epoch": 0.26, "learning_rate": 4.352155122372492e-06, "loss": 1.1888, "step": 8544 }, { "epoch": 0.26, "learning_rate": 4.351991282894832e-06, "loss": 1.1977, "step": 8545 }, { "epoch": 0.26, "learning_rate": 4.3518274257871065e-06, "loss": 1.1412, "step": 8546 }, { "epoch": 0.26, "learning_rate": 4.351663551050877e-06, "loss": 1.159, "step": 8547 }, { "epoch": 0.26, "learning_rate": 4.351499658687701e-06, "loss": 1.1115, "step": 8548 }, { "epoch": 0.26, "learning_rate": 4.35133574869914e-06, "loss": 1.1757, "step": 8549 }, { "epoch": 0.26, "learning_rate": 4.351171821086755e-06, "loss": 1.1909, "step": 8550 }, { "epoch": 0.26, "learning_rate": 4.351007875852106e-06, "loss": 1.1001, "step": 8551 }, { "epoch": 0.26, "learning_rate": 4.350843912996753e-06, "loss": 1.1065, "step": 8552 }, { "epoch": 0.26, "learning_rate": 4.350679932522257e-06, "loss": 1.0572, "step": 8553 }, { "epoch": 0.26, "learning_rate": 4.35051593443018e-06, "loss": 1.1382, "step": 8554 }, { "epoch": 0.26, "learning_rate": 4.350351918722082e-06, "loss": 1.2202, "step": 8555 }, { "epoch": 0.26, "learning_rate": 4.3501878853995246e-06, "loss": 0.8915, "step": 8556 }, { "epoch": 0.26, "learning_rate": 4.350023834464071e-06, "loss": 1.094, "step": 8557 }, { "epoch": 0.26, "learning_rate": 4.34985976591728e-06, "loss": 1.0967, "step": 8558 }, { "epoch": 0.26, "learning_rate": 4.349695679760716e-06, "loss": 1.0784, "step": 8559 }, { "epoch": 0.26, "learning_rate": 4.34953157599594e-06, "loss": 1.1101, "step": 8560 }, { "epoch": 0.26, "learning_rate": 4.349367454624513e-06, "loss": 1.1342, "step": 8561 }, { "epoch": 0.26, "learning_rate": 4.349203315648e-06, "loss": 1.1888, "step": 8562 }, { "epoch": 0.26, "learning_rate": 4.349039159067961e-06, "loss": 1.2009, "step": 8563 }, { "epoch": 0.26, "learning_rate": 4.34887498488596e-06, "loss": 1.03, "step": 8564 }, { "epoch": 0.26, "learning_rate": 4.34871079310356e-06, "loss": 1.1241, "step": 8565 }, { "epoch": 0.26, "learning_rate": 4.3485465837223235e-06, "loss": 1.2004, "step": 8566 }, { "epoch": 0.26, "learning_rate": 4.348382356743813e-06, "loss": 1.1026, "step": 8567 }, { "epoch": 0.26, "learning_rate": 4.3482181121695936e-06, "loss": 1.1145, "step": 8568 }, { "epoch": 0.26, "learning_rate": 4.348053850001228e-06, "loss": 1.1708, "step": 8569 }, { "epoch": 0.26, "learning_rate": 4.347889570240279e-06, "loss": 1.157, "step": 8570 }, { "epoch": 0.26, "learning_rate": 4.3477252728883115e-06, "loss": 1.162, "step": 8571 }, { "epoch": 0.26, "learning_rate": 4.34756095794689e-06, "loss": 1.0731, "step": 8572 }, { "epoch": 0.26, "learning_rate": 4.347396625417577e-06, "loss": 1.1414, "step": 8573 }, { "epoch": 0.26, "learning_rate": 4.347232275301938e-06, "loss": 1.1259, "step": 8574 }, { "epoch": 0.26, "learning_rate": 4.347067907601539e-06, "loss": 1.1721, "step": 8575 }, { "epoch": 0.26, "learning_rate": 4.346903522317941e-06, "loss": 1.2223, "step": 8576 }, { "epoch": 0.26, "learning_rate": 4.346739119452712e-06, "loss": 1.1547, "step": 8577 }, { "epoch": 0.26, "learning_rate": 4.346574699007416e-06, "loss": 1.0729, "step": 8578 }, { "epoch": 0.26, "learning_rate": 4.346410260983618e-06, "loss": 1.1476, "step": 8579 }, { "epoch": 0.26, "learning_rate": 4.3462458053828835e-06, "loss": 1.202, "step": 8580 }, { "epoch": 0.26, "learning_rate": 4.346081332206778e-06, "loss": 1.1189, "step": 8581 }, { "epoch": 0.26, "learning_rate": 4.345916841456867e-06, "loss": 1.1805, "step": 8582 }, { "epoch": 0.26, "learning_rate": 4.345752333134718e-06, "loss": 1.1215, "step": 8583 }, { "epoch": 0.26, "learning_rate": 4.345587807241895e-06, "loss": 1.0649, "step": 8584 }, { "epoch": 0.26, "learning_rate": 4.345423263779964e-06, "loss": 1.1458, "step": 8585 }, { "epoch": 0.26, "learning_rate": 4.345258702750493e-06, "loss": 1.1295, "step": 8586 }, { "epoch": 0.26, "learning_rate": 4.345094124155049e-06, "loss": 1.1151, "step": 8587 }, { "epoch": 0.26, "learning_rate": 4.3449295279951965e-06, "loss": 1.2026, "step": 8588 }, { "epoch": 0.26, "learning_rate": 4.344764914272503e-06, "loss": 1.2, "step": 8589 }, { "epoch": 0.26, "learning_rate": 4.344600282988537e-06, "loss": 1.1615, "step": 8590 }, { "epoch": 0.26, "learning_rate": 4.344435634144864e-06, "loss": 1.0801, "step": 8591 }, { "epoch": 0.26, "learning_rate": 4.344270967743052e-06, "loss": 1.2502, "step": 8592 }, { "epoch": 0.26, "learning_rate": 4.344106283784669e-06, "loss": 1.1459, "step": 8593 }, { "epoch": 0.26, "learning_rate": 4.343941582271283e-06, "loss": 1.2017, "step": 8594 }, { "epoch": 0.26, "learning_rate": 4.3437768632044605e-06, "loss": 1.1784, "step": 8595 }, { "epoch": 0.26, "learning_rate": 4.34361212658577e-06, "loss": 1.1374, "step": 8596 }, { "epoch": 0.26, "learning_rate": 4.34344737241678e-06, "loss": 1.0885, "step": 8597 }, { "epoch": 0.26, "learning_rate": 4.343282600699059e-06, "loss": 1.1718, "step": 8598 }, { "epoch": 0.26, "learning_rate": 4.343117811434176e-06, "loss": 1.1594, "step": 8599 }, { "epoch": 0.26, "learning_rate": 4.342953004623698e-06, "loss": 1.3053, "step": 8600 }, { "epoch": 0.26, "learning_rate": 4.342788180269196e-06, "loss": 1.1888, "step": 8601 }, { "epoch": 0.26, "learning_rate": 4.342623338372237e-06, "loss": 1.1623, "step": 8602 }, { "epoch": 0.26, "learning_rate": 4.342458478934392e-06, "loss": 1.149, "step": 8603 }, { "epoch": 0.26, "learning_rate": 4.342293601957229e-06, "loss": 1.1031, "step": 8604 }, { "epoch": 0.26, "learning_rate": 4.342128707442319e-06, "loss": 1.157, "step": 8605 }, { "epoch": 0.26, "learning_rate": 4.341963795391231e-06, "loss": 1.1432, "step": 8606 }, { "epoch": 0.26, "learning_rate": 4.341798865805534e-06, "loss": 1.1542, "step": 8607 }, { "epoch": 0.26, "learning_rate": 4.341633918686799e-06, "loss": 1.1193, "step": 8608 }, { "epoch": 0.26, "learning_rate": 4.341468954036597e-06, "loss": 1.0295, "step": 8609 }, { "epoch": 0.26, "learning_rate": 4.341303971856496e-06, "loss": 1.1329, "step": 8610 }, { "epoch": 0.26, "learning_rate": 4.341138972148069e-06, "loss": 1.267, "step": 8611 }, { "epoch": 0.26, "learning_rate": 4.3409739549128845e-06, "loss": 1.1143, "step": 8612 }, { "epoch": 0.26, "learning_rate": 4.340808920152516e-06, "loss": 1.2426, "step": 8613 }, { "epoch": 0.26, "learning_rate": 4.340643867868533e-06, "loss": 1.1676, "step": 8614 }, { "epoch": 0.26, "learning_rate": 4.3404787980625065e-06, "loss": 1.2199, "step": 8615 }, { "epoch": 0.26, "learning_rate": 4.340313710736009e-06, "loss": 1.1652, "step": 8616 }, { "epoch": 0.26, "learning_rate": 4.34014860589061e-06, "loss": 1.2489, "step": 8617 }, { "epoch": 0.26, "learning_rate": 4.339983483527883e-06, "loss": 1.2445, "step": 8618 }, { "epoch": 0.26, "learning_rate": 4.339818343649399e-06, "loss": 1.1758, "step": 8619 }, { "epoch": 0.26, "learning_rate": 4.339653186256731e-06, "loss": 1.1249, "step": 8620 }, { "epoch": 0.26, "learning_rate": 4.3394880113514504e-06, "loss": 1.1168, "step": 8621 }, { "epoch": 0.26, "learning_rate": 4.33932281893513e-06, "loss": 1.0086, "step": 8622 }, { "epoch": 0.26, "learning_rate": 4.3391576090093425e-06, "loss": 1.103, "step": 8623 }, { "epoch": 0.26, "learning_rate": 4.33899238157566e-06, "loss": 1.061, "step": 8624 }, { "epoch": 0.26, "learning_rate": 4.338827136635656e-06, "loss": 1.2271, "step": 8625 }, { "epoch": 0.26, "learning_rate": 4.3386618741909035e-06, "loss": 1.1028, "step": 8626 }, { "epoch": 0.26, "learning_rate": 4.338496594242975e-06, "loss": 1.0814, "step": 8627 }, { "epoch": 0.26, "learning_rate": 4.338331296793444e-06, "loss": 1.051, "step": 8628 }, { "epoch": 0.26, "learning_rate": 4.338165981843885e-06, "loss": 1.1196, "step": 8629 }, { "epoch": 0.26, "learning_rate": 4.338000649395871e-06, "loss": 1.1034, "step": 8630 }, { "epoch": 0.26, "learning_rate": 4.337835299450976e-06, "loss": 1.0552, "step": 8631 }, { "epoch": 0.26, "learning_rate": 4.337669932010774e-06, "loss": 1.0574, "step": 8632 }, { "epoch": 0.26, "learning_rate": 4.3375045470768395e-06, "loss": 1.1597, "step": 8633 }, { "epoch": 0.26, "learning_rate": 4.337339144650746e-06, "loss": 1.0275, "step": 8634 }, { "epoch": 0.26, "learning_rate": 4.33717372473407e-06, "loss": 1.2061, "step": 8635 }, { "epoch": 0.26, "learning_rate": 4.337008287328384e-06, "loss": 1.2113, "step": 8636 }, { "epoch": 0.26, "learning_rate": 4.336842832435264e-06, "loss": 1.3286, "step": 8637 }, { "epoch": 0.26, "learning_rate": 4.336677360056285e-06, "loss": 1.0542, "step": 8638 }, { "epoch": 0.26, "learning_rate": 4.336511870193023e-06, "loss": 1.138, "step": 8639 }, { "epoch": 0.26, "learning_rate": 4.336346362847051e-06, "loss": 1.1033, "step": 8640 }, { "epoch": 0.26, "learning_rate": 4.336180838019946e-06, "loss": 1.1791, "step": 8641 }, { "epoch": 0.26, "learning_rate": 4.336015295713285e-06, "loss": 1.0822, "step": 8642 }, { "epoch": 0.26, "learning_rate": 4.335849735928643e-06, "loss": 1.1235, "step": 8643 }, { "epoch": 0.26, "learning_rate": 4.3356841586675934e-06, "loss": 1.1382, "step": 8644 }, { "epoch": 0.26, "learning_rate": 4.335518563931717e-06, "loss": 1.1141, "step": 8645 }, { "epoch": 0.26, "learning_rate": 4.335352951722587e-06, "loss": 1.1614, "step": 8646 }, { "epoch": 0.26, "learning_rate": 4.33518732204178e-06, "loss": 1.054, "step": 8647 }, { "epoch": 0.26, "learning_rate": 4.335021674890875e-06, "loss": 1.096, "step": 8648 }, { "epoch": 0.26, "learning_rate": 4.334856010271446e-06, "loss": 1.1187, "step": 8649 }, { "epoch": 0.26, "learning_rate": 4.334690328185073e-06, "loss": 1.2054, "step": 8650 }, { "epoch": 0.26, "learning_rate": 4.3345246286333305e-06, "loss": 1.1805, "step": 8651 }, { "epoch": 0.26, "learning_rate": 4.334358911617797e-06, "loss": 1.0571, "step": 8652 }, { "epoch": 0.26, "learning_rate": 4.334193177140051e-06, "loss": 1.1279, "step": 8653 }, { "epoch": 0.26, "learning_rate": 4.334027425201669e-06, "loss": 1.1771, "step": 8654 }, { "epoch": 0.26, "learning_rate": 4.333861655804229e-06, "loss": 1.0914, "step": 8655 }, { "epoch": 0.26, "learning_rate": 4.33369586894931e-06, "loss": 1.2642, "step": 8656 }, { "epoch": 0.26, "learning_rate": 4.333530064638489e-06, "loss": 1.2459, "step": 8657 }, { "epoch": 0.26, "learning_rate": 4.333364242873344e-06, "loss": 1.0617, "step": 8658 }, { "epoch": 0.26, "learning_rate": 4.333198403655455e-06, "loss": 1.1063, "step": 8659 }, { "epoch": 0.26, "learning_rate": 4.3330325469864e-06, "loss": 1.0745, "step": 8660 }, { "epoch": 0.26, "learning_rate": 4.332866672867759e-06, "loss": 1.2563, "step": 8661 }, { "epoch": 0.26, "learning_rate": 4.3327007813011094e-06, "loss": 1.0447, "step": 8662 }, { "epoch": 0.26, "learning_rate": 4.33253487228803e-06, "loss": 1.1747, "step": 8663 }, { "epoch": 0.26, "learning_rate": 4.332368945830102e-06, "loss": 1.2081, "step": 8664 }, { "epoch": 0.26, "learning_rate": 4.332203001928905e-06, "loss": 1.0771, "step": 8665 }, { "epoch": 0.26, "learning_rate": 4.332037040586016e-06, "loss": 1.1259, "step": 8666 }, { "epoch": 0.26, "learning_rate": 4.331871061803018e-06, "loss": 1.1165, "step": 8667 }, { "epoch": 0.26, "learning_rate": 4.331705065581489e-06, "loss": 1.0987, "step": 8668 }, { "epoch": 0.26, "learning_rate": 4.331539051923011e-06, "loss": 1.1262, "step": 8669 }, { "epoch": 0.26, "learning_rate": 4.331373020829163e-06, "loss": 1.2201, "step": 8670 }, { "epoch": 0.26, "learning_rate": 4.331206972301525e-06, "loss": 1.065, "step": 8671 }, { "epoch": 0.26, "learning_rate": 4.331040906341679e-06, "loss": 1.0999, "step": 8672 }, { "epoch": 0.26, "learning_rate": 4.330874822951206e-06, "loss": 1.1208, "step": 8673 }, { "epoch": 0.26, "learning_rate": 4.330708722131686e-06, "loss": 1.2562, "step": 8674 }, { "epoch": 0.26, "learning_rate": 4.330542603884701e-06, "loss": 1.1779, "step": 8675 }, { "epoch": 0.26, "learning_rate": 4.330376468211832e-06, "loss": 1.0881, "step": 8676 }, { "epoch": 0.26, "learning_rate": 4.33021031511466e-06, "loss": 1.1997, "step": 8677 }, { "epoch": 0.26, "learning_rate": 4.330044144594767e-06, "loss": 1.1531, "step": 8678 }, { "epoch": 0.26, "learning_rate": 4.3298779566537365e-06, "loss": 1.2212, "step": 8679 }, { "epoch": 0.26, "learning_rate": 4.329711751293147e-06, "loss": 1.198, "step": 8680 }, { "epoch": 0.26, "learning_rate": 4.329545528514585e-06, "loss": 1.1717, "step": 8681 }, { "epoch": 0.26, "learning_rate": 4.32937928831963e-06, "loss": 1.0708, "step": 8682 }, { "epoch": 0.26, "learning_rate": 4.329213030709865e-06, "loss": 1.064, "step": 8683 }, { "epoch": 0.26, "learning_rate": 4.329046755686873e-06, "loss": 1.2774, "step": 8684 }, { "epoch": 0.26, "learning_rate": 4.328880463252237e-06, "loss": 1.0828, "step": 8685 }, { "epoch": 0.26, "learning_rate": 4.3287141534075395e-06, "loss": 1.2117, "step": 8686 }, { "epoch": 0.26, "learning_rate": 4.328547826154364e-06, "loss": 1.1906, "step": 8687 }, { "epoch": 0.26, "learning_rate": 4.328381481494294e-06, "loss": 1.1286, "step": 8688 }, { "epoch": 0.26, "learning_rate": 4.328215119428913e-06, "loss": 1.0529, "step": 8689 }, { "epoch": 0.26, "learning_rate": 4.328048739959805e-06, "loss": 1.2035, "step": 8690 }, { "epoch": 0.26, "learning_rate": 4.327882343088553e-06, "loss": 1.1161, "step": 8691 }, { "epoch": 0.26, "learning_rate": 4.32771592881674e-06, "loss": 1.1575, "step": 8692 }, { "epoch": 0.26, "learning_rate": 4.327549497145953e-06, "loss": 1.0101, "step": 8693 }, { "epoch": 0.26, "learning_rate": 4.327383048077776e-06, "loss": 1.1242, "step": 8694 }, { "epoch": 0.26, "learning_rate": 4.32721658161379e-06, "loss": 1.1573, "step": 8695 }, { "epoch": 0.26, "learning_rate": 4.327050097755584e-06, "loss": 1.174, "step": 8696 }, { "epoch": 0.26, "learning_rate": 4.32688359650474e-06, "loss": 1.048, "step": 8697 }, { "epoch": 0.26, "learning_rate": 4.326717077862845e-06, "loss": 1.1521, "step": 8698 }, { "epoch": 0.26, "learning_rate": 4.3265505418314825e-06, "loss": 1.1105, "step": 8699 }, { "epoch": 0.26, "learning_rate": 4.32638398841224e-06, "loss": 1.1761, "step": 8700 }, { "epoch": 0.26, "learning_rate": 4.326217417606699e-06, "loss": 1.1326, "step": 8701 }, { "epoch": 0.26, "learning_rate": 4.326050829416449e-06, "loss": 1.1396, "step": 8702 }, { "epoch": 0.26, "learning_rate": 4.325884223843075e-06, "loss": 1.2943, "step": 8703 }, { "epoch": 0.26, "learning_rate": 4.325717600888163e-06, "loss": 1.0061, "step": 8704 }, { "epoch": 0.26, "learning_rate": 4.325550960553298e-06, "loss": 1.2117, "step": 8705 }, { "epoch": 0.26, "learning_rate": 4.325384302840066e-06, "loss": 1.134, "step": 8706 }, { "epoch": 0.26, "learning_rate": 4.3252176277500555e-06, "loss": 1.17, "step": 8707 }, { "epoch": 0.26, "learning_rate": 4.325050935284853e-06, "loss": 1.1079, "step": 8708 }, { "epoch": 0.26, "learning_rate": 4.324884225446043e-06, "loss": 1.1299, "step": 8709 }, { "epoch": 0.26, "learning_rate": 4.324717498235215e-06, "loss": 1.2125, "step": 8710 }, { "epoch": 0.26, "learning_rate": 4.324550753653956e-06, "loss": 1.1035, "step": 8711 }, { "epoch": 0.26, "learning_rate": 4.324383991703851e-06, "loss": 1.2387, "step": 8712 }, { "epoch": 0.26, "learning_rate": 4.32421721238649e-06, "loss": 1.1124, "step": 8713 }, { "epoch": 0.26, "learning_rate": 4.324050415703459e-06, "loss": 1.085, "step": 8714 }, { "epoch": 0.26, "learning_rate": 4.3238836016563475e-06, "loss": 1.0493, "step": 8715 }, { "epoch": 0.26, "learning_rate": 4.323716770246742e-06, "loss": 1.1274, "step": 8716 }, { "epoch": 0.26, "learning_rate": 4.323549921476231e-06, "loss": 1.2571, "step": 8717 }, { "epoch": 0.26, "learning_rate": 4.323383055346403e-06, "loss": 1.334, "step": 8718 }, { "epoch": 0.26, "learning_rate": 4.323216171858847e-06, "loss": 1.2231, "step": 8719 }, { "epoch": 0.26, "learning_rate": 4.3230492710151505e-06, "loss": 1.1841, "step": 8720 }, { "epoch": 0.26, "learning_rate": 4.322882352816903e-06, "loss": 1.1344, "step": 8721 }, { "epoch": 0.26, "learning_rate": 4.322715417265694e-06, "loss": 1.0914, "step": 8722 }, { "epoch": 0.26, "learning_rate": 4.322548464363112e-06, "loss": 1.0628, "step": 8723 }, { "epoch": 0.26, "learning_rate": 4.3223814941107465e-06, "loss": 1.2275, "step": 8724 }, { "epoch": 0.26, "learning_rate": 4.322214506510186e-06, "loss": 1.1477, "step": 8725 }, { "epoch": 0.26, "learning_rate": 4.322047501563022e-06, "loss": 1.1383, "step": 8726 }, { "epoch": 0.26, "learning_rate": 4.321880479270842e-06, "loss": 1.1428, "step": 8727 }, { "epoch": 0.26, "learning_rate": 4.321713439635239e-06, "loss": 1.2921, "step": 8728 }, { "epoch": 0.26, "learning_rate": 4.321546382657801e-06, "loss": 1.0824, "step": 8729 }, { "epoch": 0.26, "learning_rate": 4.321379308340118e-06, "loss": 1.2639, "step": 8730 }, { "epoch": 0.26, "learning_rate": 4.321212216683781e-06, "loss": 1.1536, "step": 8731 }, { "epoch": 0.26, "learning_rate": 4.321045107690381e-06, "loss": 1.1459, "step": 8732 }, { "epoch": 0.26, "learning_rate": 4.3208779813615095e-06, "loss": 1.1374, "step": 8733 }, { "epoch": 0.26, "learning_rate": 4.320710837698756e-06, "loss": 1.1863, "step": 8734 }, { "epoch": 0.26, "learning_rate": 4.3205436767037124e-06, "loss": 1.1287, "step": 8735 }, { "epoch": 0.26, "learning_rate": 4.320376498377969e-06, "loss": 1.1475, "step": 8736 }, { "epoch": 0.26, "learning_rate": 4.320209302723119e-06, "loss": 1.1958, "step": 8737 }, { "epoch": 0.26, "learning_rate": 4.320042089740752e-06, "loss": 1.04, "step": 8738 }, { "epoch": 0.26, "learning_rate": 4.319874859432462e-06, "loss": 1.105, "step": 8739 }, { "epoch": 0.26, "learning_rate": 4.31970761179984e-06, "loss": 1.1215, "step": 8740 }, { "epoch": 0.26, "learning_rate": 4.319540346844478e-06, "loss": 1.1201, "step": 8741 }, { "epoch": 0.26, "learning_rate": 4.319373064567966e-06, "loss": 1.0936, "step": 8742 }, { "epoch": 0.26, "learning_rate": 4.319205764971901e-06, "loss": 1.1192, "step": 8743 }, { "epoch": 0.26, "learning_rate": 4.319038448057873e-06, "loss": 1.1079, "step": 8744 }, { "epoch": 0.26, "learning_rate": 4.318871113827474e-06, "loss": 1.1464, "step": 8745 }, { "epoch": 0.26, "learning_rate": 4.318703762282299e-06, "loss": 1.0402, "step": 8746 }, { "epoch": 0.26, "learning_rate": 4.31853639342394e-06, "loss": 1.1134, "step": 8747 }, { "epoch": 0.26, "learning_rate": 4.3183690072539895e-06, "loss": 1.1464, "step": 8748 }, { "epoch": 0.26, "learning_rate": 4.318201603774043e-06, "loss": 1.0464, "step": 8749 }, { "epoch": 0.26, "learning_rate": 4.318034182985692e-06, "loss": 1.0597, "step": 8750 }, { "epoch": 0.26, "learning_rate": 4.317866744890531e-06, "loss": 1.2021, "step": 8751 }, { "epoch": 0.26, "learning_rate": 4.317699289490155e-06, "loss": 1.1422, "step": 8752 }, { "epoch": 0.26, "learning_rate": 4.317531816786157e-06, "loss": 1.1305, "step": 8753 }, { "epoch": 0.26, "learning_rate": 4.317364326780131e-06, "loss": 1.2868, "step": 8754 }, { "epoch": 0.26, "learning_rate": 4.317196819473672e-06, "loss": 1.2644, "step": 8755 }, { "epoch": 0.26, "learning_rate": 4.317029294868375e-06, "loss": 1.1208, "step": 8756 }, { "epoch": 0.26, "learning_rate": 4.316861752965833e-06, "loss": 1.0956, "step": 8757 }, { "epoch": 0.26, "learning_rate": 4.316694193767643e-06, "loss": 1.1184, "step": 8758 }, { "epoch": 0.26, "learning_rate": 4.3165266172754e-06, "loss": 1.1622, "step": 8759 }, { "epoch": 0.26, "learning_rate": 4.316359023490697e-06, "loss": 1.1792, "step": 8760 }, { "epoch": 0.26, "learning_rate": 4.316191412415132e-06, "loss": 1.2594, "step": 8761 }, { "epoch": 0.26, "learning_rate": 4.316023784050298e-06, "loss": 1.2888, "step": 8762 }, { "epoch": 0.26, "learning_rate": 4.315856138397793e-06, "loss": 1.1204, "step": 8763 }, { "epoch": 0.26, "learning_rate": 4.315688475459213e-06, "loss": 1.2872, "step": 8764 }, { "epoch": 0.26, "learning_rate": 4.3155207952361525e-06, "loss": 1.1531, "step": 8765 }, { "epoch": 0.26, "learning_rate": 4.315353097730208e-06, "loss": 1.1436, "step": 8766 }, { "epoch": 0.26, "learning_rate": 4.315185382942977e-06, "loss": 1.1478, "step": 8767 }, { "epoch": 0.26, "learning_rate": 4.315017650876055e-06, "loss": 1.0079, "step": 8768 }, { "epoch": 0.26, "learning_rate": 4.314849901531038e-06, "loss": 1.1091, "step": 8769 }, { "epoch": 0.26, "learning_rate": 4.3146821349095255e-06, "loss": 1.2197, "step": 8770 }, { "epoch": 0.26, "learning_rate": 4.314514351013113e-06, "loss": 1.0529, "step": 8771 }, { "epoch": 0.26, "learning_rate": 4.314346549843398e-06, "loss": 1.1516, "step": 8772 }, { "epoch": 0.26, "learning_rate": 4.314178731401977e-06, "loss": 1.1104, "step": 8773 }, { "epoch": 0.26, "learning_rate": 4.314010895690449e-06, "loss": 1.2328, "step": 8774 }, { "epoch": 0.26, "learning_rate": 4.313843042710409e-06, "loss": 1.2449, "step": 8775 }, { "epoch": 0.26, "learning_rate": 4.313675172463459e-06, "loss": 1.1816, "step": 8776 }, { "epoch": 0.26, "learning_rate": 4.3135072849511935e-06, "loss": 1.1885, "step": 8777 }, { "epoch": 0.26, "learning_rate": 4.313339380175213e-06, "loss": 1.1189, "step": 8778 }, { "epoch": 0.26, "learning_rate": 4.313171458137114e-06, "loss": 1.0867, "step": 8779 }, { "epoch": 0.26, "learning_rate": 4.313003518838497e-06, "loss": 1.0715, "step": 8780 }, { "epoch": 0.26, "learning_rate": 4.31283556228096e-06, "loss": 1.182, "step": 8781 }, { "epoch": 0.26, "learning_rate": 4.312667588466099e-06, "loss": 1.1343, "step": 8782 }, { "epoch": 0.26, "learning_rate": 4.312499597395518e-06, "loss": 1.1705, "step": 8783 }, { "epoch": 0.26, "learning_rate": 4.312331589070813e-06, "loss": 1.1937, "step": 8784 }, { "epoch": 0.26, "learning_rate": 4.312163563493584e-06, "loss": 1.2327, "step": 8785 }, { "epoch": 0.26, "learning_rate": 4.311995520665431e-06, "loss": 1.1735, "step": 8786 }, { "epoch": 0.26, "learning_rate": 4.311827460587953e-06, "loss": 1.0757, "step": 8787 }, { "epoch": 0.26, "learning_rate": 4.31165938326275e-06, "loss": 1.1531, "step": 8788 }, { "epoch": 0.26, "learning_rate": 4.311491288691423e-06, "loss": 1.0825, "step": 8789 }, { "epoch": 0.26, "learning_rate": 4.31132317687557e-06, "loss": 1.1149, "step": 8790 }, { "epoch": 0.26, "learning_rate": 4.311155047816794e-06, "loss": 1.1762, "step": 8791 }, { "epoch": 0.26, "learning_rate": 4.310986901516694e-06, "loss": 1.2268, "step": 8792 }, { "epoch": 0.26, "learning_rate": 4.31081873797687e-06, "loss": 1.0991, "step": 8793 }, { "epoch": 0.26, "learning_rate": 4.310650557198925e-06, "loss": 1.2352, "step": 8794 }, { "epoch": 0.26, "learning_rate": 4.310482359184458e-06, "loss": 1.1009, "step": 8795 }, { "epoch": 0.26, "learning_rate": 4.310314143935071e-06, "loss": 1.0337, "step": 8796 }, { "epoch": 0.27, "learning_rate": 4.310145911452365e-06, "loss": 1.1472, "step": 8797 }, { "epoch": 0.27, "learning_rate": 4.309977661737942e-06, "loss": 1.2031, "step": 8798 }, { "epoch": 0.27, "learning_rate": 4.309809394793404e-06, "loss": 1.1462, "step": 8799 }, { "epoch": 0.27, "learning_rate": 4.309641110620352e-06, "loss": 1.176, "step": 8800 }, { "epoch": 0.27, "learning_rate": 4.309472809220388e-06, "loss": 1.0925, "step": 8801 }, { "epoch": 0.27, "learning_rate": 4.309304490595113e-06, "loss": 1.1738, "step": 8802 }, { "epoch": 0.27, "learning_rate": 4.309136154746132e-06, "loss": 1.1196, "step": 8803 }, { "epoch": 0.27, "learning_rate": 4.308967801675046e-06, "loss": 1.1007, "step": 8804 }, { "epoch": 0.27, "learning_rate": 4.308799431383457e-06, "loss": 1.2717, "step": 8805 }, { "epoch": 0.27, "learning_rate": 4.30863104387297e-06, "loss": 1.0263, "step": 8806 }, { "epoch": 0.27, "learning_rate": 4.308462639145186e-06, "loss": 1.1437, "step": 8807 }, { "epoch": 0.27, "learning_rate": 4.308294217201707e-06, "loss": 1.2017, "step": 8808 }, { "epoch": 0.27, "learning_rate": 4.30812577804414e-06, "loss": 1.1136, "step": 8809 }, { "epoch": 0.27, "learning_rate": 4.3079573216740855e-06, "loss": 1.1036, "step": 8810 }, { "epoch": 0.27, "learning_rate": 4.307788848093148e-06, "loss": 1.2711, "step": 8811 }, { "epoch": 0.27, "learning_rate": 4.307620357302932e-06, "loss": 1.2437, "step": 8812 }, { "epoch": 0.27, "learning_rate": 4.30745184930504e-06, "loss": 1.0417, "step": 8813 }, { "epoch": 0.27, "learning_rate": 4.307283324101078e-06, "loss": 1.239, "step": 8814 }, { "epoch": 0.27, "learning_rate": 4.3071147816926484e-06, "loss": 1.2433, "step": 8815 }, { "epoch": 0.27, "learning_rate": 4.306946222081356e-06, "loss": 1.105, "step": 8816 }, { "epoch": 0.27, "learning_rate": 4.306777645268806e-06, "loss": 1.0569, "step": 8817 }, { "epoch": 0.27, "learning_rate": 4.306609051256603e-06, "loss": 1.1519, "step": 8818 }, { "epoch": 0.27, "learning_rate": 4.306440440046353e-06, "loss": 1.0289, "step": 8819 }, { "epoch": 0.27, "learning_rate": 4.306271811639659e-06, "loss": 1.174, "step": 8820 }, { "epoch": 0.27, "learning_rate": 4.3061031660381275e-06, "loss": 1.1023, "step": 8821 }, { "epoch": 0.27, "learning_rate": 4.305934503243364e-06, "loss": 1.067, "step": 8822 }, { "epoch": 0.27, "learning_rate": 4.305765823256973e-06, "loss": 1.1971, "step": 8823 }, { "epoch": 0.27, "learning_rate": 4.305597126080562e-06, "loss": 1.2474, "step": 8824 }, { "epoch": 0.27, "learning_rate": 4.305428411715735e-06, "loss": 1.0916, "step": 8825 }, { "epoch": 0.27, "learning_rate": 4.3052596801641e-06, "loss": 1.1628, "step": 8826 }, { "epoch": 0.27, "learning_rate": 4.305090931427262e-06, "loss": 1.0533, "step": 8827 }, { "epoch": 0.27, "learning_rate": 4.304922165506827e-06, "loss": 1.0348, "step": 8828 }, { "epoch": 0.27, "learning_rate": 4.304753382404403e-06, "loss": 1.2133, "step": 8829 }, { "epoch": 0.27, "learning_rate": 4.304584582121596e-06, "loss": 1.2216, "step": 8830 }, { "epoch": 0.27, "learning_rate": 4.304415764660013e-06, "loss": 1.1978, "step": 8831 }, { "epoch": 0.27, "learning_rate": 4.30424693002126e-06, "loss": 1.2048, "step": 8832 }, { "epoch": 0.27, "learning_rate": 4.304078078206946e-06, "loss": 1.1185, "step": 8833 }, { "epoch": 0.27, "learning_rate": 4.303909209218677e-06, "loss": 1.1116, "step": 8834 }, { "epoch": 0.27, "learning_rate": 4.303740323058062e-06, "loss": 1.2192, "step": 8835 }, { "epoch": 0.27, "learning_rate": 4.303571419726707e-06, "loss": 1.1454, "step": 8836 }, { "epoch": 0.27, "learning_rate": 4.303402499226221e-06, "loss": 1.1482, "step": 8837 }, { "epoch": 0.27, "learning_rate": 4.303233561558212e-06, "loss": 1.0934, "step": 8838 }, { "epoch": 0.27, "learning_rate": 4.303064606724288e-06, "loss": 1.0638, "step": 8839 }, { "epoch": 0.27, "learning_rate": 4.302895634726057e-06, "loss": 1.0439, "step": 8840 }, { "epoch": 0.27, "learning_rate": 4.302726645565129e-06, "loss": 1.0472, "step": 8841 }, { "epoch": 0.27, "learning_rate": 4.30255763924311e-06, "loss": 1.0364, "step": 8842 }, { "epoch": 0.27, "learning_rate": 4.302388615761611e-06, "loss": 1.2788, "step": 8843 }, { "epoch": 0.27, "learning_rate": 4.302219575122239e-06, "loss": 1.3479, "step": 8844 }, { "epoch": 0.27, "learning_rate": 4.302050517326607e-06, "loss": 1.191, "step": 8845 }, { "epoch": 0.27, "learning_rate": 4.301881442376321e-06, "loss": 1.1122, "step": 8846 }, { "epoch": 0.27, "learning_rate": 4.301712350272991e-06, "loss": 1.1191, "step": 8847 }, { "epoch": 0.27, "learning_rate": 4.301543241018228e-06, "loss": 1.1412, "step": 8848 }, { "epoch": 0.27, "learning_rate": 4.3013741146136406e-06, "loss": 1.266, "step": 8849 }, { "epoch": 0.27, "learning_rate": 4.30120497106084e-06, "loss": 1.1889, "step": 8850 }, { "epoch": 0.27, "learning_rate": 4.301035810361433e-06, "loss": 1.1819, "step": 8851 }, { "epoch": 0.27, "learning_rate": 4.3008666325170355e-06, "loss": 1.1592, "step": 8852 }, { "epoch": 0.27, "learning_rate": 4.300697437529253e-06, "loss": 1.1761, "step": 8853 }, { "epoch": 0.27, "learning_rate": 4.3005282253996996e-06, "loss": 1.2156, "step": 8854 }, { "epoch": 0.27, "learning_rate": 4.300358996129984e-06, "loss": 1.1392, "step": 8855 }, { "epoch": 0.27, "learning_rate": 4.3001897497217186e-06, "loss": 1.2167, "step": 8856 }, { "epoch": 0.27, "learning_rate": 4.300020486176512e-06, "loss": 1.1684, "step": 8857 }, { "epoch": 0.27, "learning_rate": 4.2998512054959785e-06, "loss": 1.1436, "step": 8858 }, { "epoch": 0.27, "learning_rate": 4.299681907681728e-06, "loss": 1.1144, "step": 8859 }, { "epoch": 0.27, "learning_rate": 4.299512592735373e-06, "loss": 1.1127, "step": 8860 }, { "epoch": 0.27, "learning_rate": 4.2993432606585235e-06, "loss": 1.2085, "step": 8861 }, { "epoch": 0.27, "learning_rate": 4.299173911452794e-06, "loss": 1.1202, "step": 8862 }, { "epoch": 0.27, "learning_rate": 4.2990045451197956e-06, "loss": 1.1672, "step": 8863 }, { "epoch": 0.27, "learning_rate": 4.29883516166114e-06, "loss": 1.151, "step": 8864 }, { "epoch": 0.27, "learning_rate": 4.298665761078439e-06, "loss": 1.1138, "step": 8865 }, { "epoch": 0.27, "learning_rate": 4.298496343373307e-06, "loss": 1.0929, "step": 8866 }, { "epoch": 0.27, "learning_rate": 4.298326908547357e-06, "loss": 1.1553, "step": 8867 }, { "epoch": 0.27, "learning_rate": 4.2981574566022e-06, "loss": 1.0873, "step": 8868 }, { "epoch": 0.27, "learning_rate": 4.29798798753945e-06, "loss": 1.1889, "step": 8869 }, { "epoch": 0.27, "learning_rate": 4.29781850136072e-06, "loss": 1.1727, "step": 8870 }, { "epoch": 0.27, "learning_rate": 4.297648998067624e-06, "loss": 1.1829, "step": 8871 }, { "epoch": 0.27, "learning_rate": 4.297479477661775e-06, "loss": 1.1821, "step": 8872 }, { "epoch": 0.27, "learning_rate": 4.297309940144788e-06, "loss": 1.0759, "step": 8873 }, { "epoch": 0.27, "learning_rate": 4.297140385518275e-06, "loss": 1.2217, "step": 8874 }, { "epoch": 0.27, "learning_rate": 4.2969708137838515e-06, "loss": 1.1317, "step": 8875 }, { "epoch": 0.27, "learning_rate": 4.296801224943131e-06, "loss": 1.2098, "step": 8876 }, { "epoch": 0.27, "learning_rate": 4.296631618997728e-06, "loss": 1.1542, "step": 8877 }, { "epoch": 0.27, "learning_rate": 4.2964619959492586e-06, "loss": 1.072, "step": 8878 }, { "epoch": 0.27, "learning_rate": 4.296292355799335e-06, "loss": 1.0927, "step": 8879 }, { "epoch": 0.27, "learning_rate": 4.296122698549574e-06, "loss": 1.0845, "step": 8880 }, { "epoch": 0.27, "learning_rate": 4.29595302420159e-06, "loss": 1.2031, "step": 8881 }, { "epoch": 0.27, "learning_rate": 4.295783332756997e-06, "loss": 1.1674, "step": 8882 }, { "epoch": 0.27, "learning_rate": 4.295613624217413e-06, "loss": 1.1475, "step": 8883 }, { "epoch": 0.27, "learning_rate": 4.295443898584451e-06, "loss": 1.1178, "step": 8884 }, { "epoch": 0.27, "learning_rate": 4.295274155859729e-06, "loss": 1.2244, "step": 8885 }, { "epoch": 0.27, "learning_rate": 4.295104396044861e-06, "loss": 1.2239, "step": 8886 }, { "epoch": 0.27, "learning_rate": 4.2949346191414635e-06, "loss": 1.2347, "step": 8887 }, { "epoch": 0.27, "learning_rate": 4.294764825151153e-06, "loss": 1.1401, "step": 8888 }, { "epoch": 0.27, "learning_rate": 4.2945950140755454e-06, "loss": 1.1016, "step": 8889 }, { "epoch": 0.27, "learning_rate": 4.294425185916258e-06, "loss": 1.12, "step": 8890 }, { "epoch": 0.27, "learning_rate": 4.2942553406749064e-06, "loss": 1.0901, "step": 8891 }, { "epoch": 0.27, "learning_rate": 4.2940854783531096e-06, "loss": 1.1274, "step": 8892 }, { "epoch": 0.27, "learning_rate": 4.2939155989524815e-06, "loss": 1.0998, "step": 8893 }, { "epoch": 0.27, "learning_rate": 4.293745702474642e-06, "loss": 1.2095, "step": 8894 }, { "epoch": 0.27, "learning_rate": 4.293575788921207e-06, "loss": 1.2059, "step": 8895 }, { "epoch": 0.27, "learning_rate": 4.293405858293794e-06, "loss": 1.0933, "step": 8896 }, { "epoch": 0.27, "learning_rate": 4.2932359105940215e-06, "loss": 1.1818, "step": 8897 }, { "epoch": 0.27, "learning_rate": 4.293065945823506e-06, "loss": 1.1946, "step": 8898 }, { "epoch": 0.27, "learning_rate": 4.292895963983866e-06, "loss": 1.1222, "step": 8899 }, { "epoch": 0.27, "learning_rate": 4.292725965076721e-06, "loss": 1.1678, "step": 8900 }, { "epoch": 0.27, "learning_rate": 4.292555949103688e-06, "loss": 1.2596, "step": 8901 }, { "epoch": 0.27, "learning_rate": 4.292385916066385e-06, "loss": 1.1316, "step": 8902 }, { "epoch": 0.27, "learning_rate": 4.292215865966433e-06, "loss": 1.181, "step": 8903 }, { "epoch": 0.27, "learning_rate": 4.292045798805448e-06, "loss": 1.076, "step": 8904 }, { "epoch": 0.27, "learning_rate": 4.29187571458505e-06, "loss": 1.104, "step": 8905 }, { "epoch": 0.27, "learning_rate": 4.291705613306858e-06, "loss": 1.286, "step": 8906 }, { "epoch": 0.27, "learning_rate": 4.291535494972491e-06, "loss": 1.1431, "step": 8907 }, { "epoch": 0.27, "learning_rate": 4.2913653595835705e-06, "loss": 1.1295, "step": 8908 }, { "epoch": 0.27, "learning_rate": 4.291195207141713e-06, "loss": 1.1783, "step": 8909 }, { "epoch": 0.27, "learning_rate": 4.291025037648541e-06, "loss": 1.0871, "step": 8910 }, { "epoch": 0.27, "learning_rate": 4.290854851105672e-06, "loss": 1.0897, "step": 8911 }, { "epoch": 0.27, "learning_rate": 4.290684647514728e-06, "loss": 1.2651, "step": 8912 }, { "epoch": 0.27, "learning_rate": 4.290514426877328e-06, "loss": 1.0588, "step": 8913 }, { "epoch": 0.27, "learning_rate": 4.290344189195094e-06, "loss": 1.0923, "step": 8914 }, { "epoch": 0.27, "learning_rate": 4.290173934469646e-06, "loss": 1.1547, "step": 8915 }, { "epoch": 0.27, "learning_rate": 4.290003662702603e-06, "loss": 1.1174, "step": 8916 }, { "epoch": 0.27, "learning_rate": 4.289833373895588e-06, "loss": 1.1804, "step": 8917 }, { "epoch": 0.27, "learning_rate": 4.289663068050221e-06, "loss": 1.269, "step": 8918 }, { "epoch": 0.27, "learning_rate": 4.289492745168124e-06, "loss": 1.3033, "step": 8919 }, { "epoch": 0.27, "learning_rate": 4.289322405250916e-06, "loss": 1.0831, "step": 8920 }, { "epoch": 0.27, "learning_rate": 4.2891520483002224e-06, "loss": 1.1108, "step": 8921 }, { "epoch": 0.27, "learning_rate": 4.288981674317663e-06, "loss": 1.0806, "step": 8922 }, { "epoch": 0.27, "learning_rate": 4.288811283304859e-06, "loss": 1.2271, "step": 8923 }, { "epoch": 0.27, "learning_rate": 4.288640875263433e-06, "loss": 1.1255, "step": 8924 }, { "epoch": 0.27, "learning_rate": 4.288470450195007e-06, "loss": 1.1486, "step": 8925 }, { "epoch": 0.27, "learning_rate": 4.288300008101205e-06, "loss": 1.2958, "step": 8926 }, { "epoch": 0.27, "learning_rate": 4.288129548983647e-06, "loss": 1.2314, "step": 8927 }, { "epoch": 0.27, "learning_rate": 4.287959072843957e-06, "loss": 1.0612, "step": 8928 }, { "epoch": 0.27, "learning_rate": 4.287788579683759e-06, "loss": 1.0005, "step": 8929 }, { "epoch": 0.27, "learning_rate": 4.287618069504673e-06, "loss": 1.2623, "step": 8930 }, { "epoch": 0.27, "learning_rate": 4.287447542308325e-06, "loss": 1.1404, "step": 8931 }, { "epoch": 0.27, "learning_rate": 4.287276998096337e-06, "loss": 1.1201, "step": 8932 }, { "epoch": 0.27, "learning_rate": 4.287106436870333e-06, "loss": 1.1313, "step": 8933 }, { "epoch": 0.27, "learning_rate": 4.2869358586319355e-06, "loss": 1.2703, "step": 8934 }, { "epoch": 0.27, "learning_rate": 4.286765263382771e-06, "loss": 1.1149, "step": 8935 }, { "epoch": 0.27, "learning_rate": 4.28659465112446e-06, "loss": 1.1994, "step": 8936 }, { "epoch": 0.27, "learning_rate": 4.286424021858629e-06, "loss": 1.0842, "step": 8937 }, { "epoch": 0.27, "learning_rate": 4.286253375586901e-06, "loss": 1.0256, "step": 8938 }, { "epoch": 0.27, "learning_rate": 4.286082712310903e-06, "loss": 1.1284, "step": 8939 }, { "epoch": 0.27, "learning_rate": 4.285912032032256e-06, "loss": 1.1035, "step": 8940 }, { "epoch": 0.27, "learning_rate": 4.285741334752588e-06, "loss": 1.1863, "step": 8941 }, { "epoch": 0.27, "learning_rate": 4.285570620473522e-06, "loss": 1.1743, "step": 8942 }, { "epoch": 0.27, "learning_rate": 4.285399889196683e-06, "loss": 1.2101, "step": 8943 }, { "epoch": 0.27, "learning_rate": 4.2852291409236965e-06, "loss": 1.1922, "step": 8944 }, { "epoch": 0.27, "learning_rate": 4.28505837565619e-06, "loss": 1.1323, "step": 8945 }, { "epoch": 0.27, "learning_rate": 4.284887593395787e-06, "loss": 1.283, "step": 8946 }, { "epoch": 0.27, "learning_rate": 4.284716794144113e-06, "loss": 1.1819, "step": 8947 }, { "epoch": 0.27, "learning_rate": 4.284545977902795e-06, "loss": 1.196, "step": 8948 }, { "epoch": 0.27, "learning_rate": 4.284375144673459e-06, "loss": 1.3448, "step": 8949 }, { "epoch": 0.27, "learning_rate": 4.284204294457731e-06, "loss": 1.2335, "step": 8950 }, { "epoch": 0.27, "learning_rate": 4.284033427257237e-06, "loss": 1.2208, "step": 8951 }, { "epoch": 0.27, "learning_rate": 4.2838625430736046e-06, "loss": 1.1171, "step": 8952 }, { "epoch": 0.27, "learning_rate": 4.28369164190846e-06, "loss": 1.0951, "step": 8953 }, { "epoch": 0.27, "learning_rate": 4.283520723763429e-06, "loss": 1.1286, "step": 8954 }, { "epoch": 0.27, "learning_rate": 4.28334978864014e-06, "loss": 1.1654, "step": 8955 }, { "epoch": 0.27, "learning_rate": 4.2831788365402205e-06, "loss": 1.152, "step": 8956 }, { "epoch": 0.27, "learning_rate": 4.2830078674652965e-06, "loss": 1.0474, "step": 8957 }, { "epoch": 0.27, "learning_rate": 4.282836881416997e-06, "loss": 1.2014, "step": 8958 }, { "epoch": 0.27, "learning_rate": 4.282665878396949e-06, "loss": 1.1311, "step": 8959 }, { "epoch": 0.27, "learning_rate": 4.282494858406781e-06, "loss": 1.1298, "step": 8960 }, { "epoch": 0.27, "learning_rate": 4.282323821448119e-06, "loss": 1.1812, "step": 8961 }, { "epoch": 0.27, "learning_rate": 4.282152767522594e-06, "loss": 1.1141, "step": 8962 }, { "epoch": 0.27, "learning_rate": 4.281981696631832e-06, "loss": 1.128, "step": 8963 }, { "epoch": 0.27, "learning_rate": 4.2818106087774625e-06, "loss": 1.1251, "step": 8964 }, { "epoch": 0.27, "learning_rate": 4.281639503961114e-06, "loss": 1.1646, "step": 8965 }, { "epoch": 0.27, "learning_rate": 4.281468382184416e-06, "loss": 1.1241, "step": 8966 }, { "epoch": 0.27, "learning_rate": 4.281297243448997e-06, "loss": 1.1856, "step": 8967 }, { "epoch": 0.27, "learning_rate": 4.281126087756487e-06, "loss": 1.2209, "step": 8968 }, { "epoch": 0.27, "learning_rate": 4.280954915108513e-06, "loss": 1.2016, "step": 8969 }, { "epoch": 0.27, "learning_rate": 4.280783725506706e-06, "loss": 1.0934, "step": 8970 }, { "epoch": 0.27, "learning_rate": 4.280612518952696e-06, "loss": 1.0954, "step": 8971 }, { "epoch": 0.27, "learning_rate": 4.280441295448112e-06, "loss": 1.0681, "step": 8972 }, { "epoch": 0.27, "learning_rate": 4.280270054994586e-06, "loss": 1.28, "step": 8973 }, { "epoch": 0.27, "learning_rate": 4.280098797593744e-06, "loss": 1.1671, "step": 8974 }, { "epoch": 0.27, "learning_rate": 4.27992752324722e-06, "loss": 1.0878, "step": 8975 }, { "epoch": 0.27, "learning_rate": 4.2797562319566435e-06, "loss": 1.1813, "step": 8976 }, { "epoch": 0.27, "learning_rate": 4.279584923723645e-06, "loss": 0.9933, "step": 8977 }, { "epoch": 0.27, "learning_rate": 4.2794135985498544e-06, "loss": 1.1849, "step": 8978 }, { "epoch": 0.27, "learning_rate": 4.279242256436904e-06, "loss": 1.1835, "step": 8979 }, { "epoch": 0.27, "learning_rate": 4.279070897386424e-06, "loss": 1.1305, "step": 8980 }, { "epoch": 0.27, "learning_rate": 4.278899521400045e-06, "loss": 1.1035, "step": 8981 }, { "epoch": 0.27, "learning_rate": 4.2787281284794e-06, "loss": 1.0959, "step": 8982 }, { "epoch": 0.27, "learning_rate": 4.27855671862612e-06, "loss": 1.0795, "step": 8983 }, { "epoch": 0.27, "learning_rate": 4.278385291841837e-06, "loss": 1.0635, "step": 8984 }, { "epoch": 0.27, "learning_rate": 4.278213848128182e-06, "loss": 1.1336, "step": 8985 }, { "epoch": 0.27, "learning_rate": 4.278042387486787e-06, "loss": 1.0648, "step": 8986 }, { "epoch": 0.27, "learning_rate": 4.277870909919286e-06, "loss": 1.1083, "step": 8987 }, { "epoch": 0.27, "learning_rate": 4.27769941542731e-06, "loss": 1.0873, "step": 8988 }, { "epoch": 0.27, "learning_rate": 4.277527904012491e-06, "loss": 1.1492, "step": 8989 }, { "epoch": 0.27, "learning_rate": 4.277356375676462e-06, "loss": 1.1184, "step": 8990 }, { "epoch": 0.27, "learning_rate": 4.277184830420858e-06, "loss": 1.1379, "step": 8991 }, { "epoch": 0.27, "learning_rate": 4.27701326824731e-06, "loss": 1.134, "step": 8992 }, { "epoch": 0.27, "learning_rate": 4.27684168915745e-06, "loss": 1.1745, "step": 8993 }, { "epoch": 0.27, "learning_rate": 4.276670093152915e-06, "loss": 1.1367, "step": 8994 }, { "epoch": 0.27, "learning_rate": 4.276498480235335e-06, "loss": 1.1113, "step": 8995 }, { "epoch": 0.27, "learning_rate": 4.276326850406345e-06, "loss": 1.113, "step": 8996 }, { "epoch": 0.27, "learning_rate": 4.276155203667579e-06, "loss": 1.0485, "step": 8997 }, { "epoch": 0.27, "learning_rate": 4.275983540020671e-06, "loss": 1.149, "step": 8998 }, { "epoch": 0.27, "learning_rate": 4.275811859467255e-06, "loss": 1.1727, "step": 8999 }, { "epoch": 0.27, "learning_rate": 4.275640162008966e-06, "loss": 1.2222, "step": 9000 }, { "epoch": 0.27, "learning_rate": 4.275468447647438e-06, "loss": 1.1234, "step": 9001 }, { "epoch": 0.27, "learning_rate": 4.275296716384304e-06, "loss": 1.1953, "step": 9002 }, { "epoch": 0.27, "learning_rate": 4.275124968221201e-06, "loss": 1.093, "step": 9003 }, { "epoch": 0.27, "learning_rate": 4.274953203159763e-06, "loss": 1.1807, "step": 9004 }, { "epoch": 0.27, "learning_rate": 4.274781421201626e-06, "loss": 1.2792, "step": 9005 }, { "epoch": 0.27, "learning_rate": 4.2746096223484245e-06, "loss": 1.1591, "step": 9006 }, { "epoch": 0.27, "learning_rate": 4.274437806601794e-06, "loss": 1.0891, "step": 9007 }, { "epoch": 0.27, "learning_rate": 4.2742659739633695e-06, "loss": 1.058, "step": 9008 }, { "epoch": 0.27, "learning_rate": 4.274094124434788e-06, "loss": 1.0943, "step": 9009 }, { "epoch": 0.27, "learning_rate": 4.273922258017685e-06, "loss": 1.0828, "step": 9010 }, { "epoch": 0.27, "learning_rate": 4.273750374713697e-06, "loss": 1.0988, "step": 9011 }, { "epoch": 0.27, "learning_rate": 4.273578474524459e-06, "loss": 1.2403, "step": 9012 }, { "epoch": 0.27, "learning_rate": 4.273406557451608e-06, "loss": 1.088, "step": 9013 }, { "epoch": 0.27, "learning_rate": 4.2732346234967805e-06, "loss": 1.2229, "step": 9014 }, { "epoch": 0.27, "learning_rate": 4.273062672661613e-06, "loss": 1.1648, "step": 9015 }, { "epoch": 0.27, "learning_rate": 4.272890704947744e-06, "loss": 1.0144, "step": 9016 }, { "epoch": 0.27, "learning_rate": 4.272718720356809e-06, "loss": 1.1093, "step": 9017 }, { "epoch": 0.27, "learning_rate": 4.2725467188904455e-06, "loss": 1.187, "step": 9018 }, { "epoch": 0.27, "learning_rate": 4.27237470055029e-06, "loss": 1.1527, "step": 9019 }, { "epoch": 0.27, "learning_rate": 4.2722026653379824e-06, "loss": 1.1018, "step": 9020 }, { "epoch": 0.27, "learning_rate": 4.272030613255158e-06, "loss": 1.1902, "step": 9021 }, { "epoch": 0.27, "learning_rate": 4.2718585443034564e-06, "loss": 1.142, "step": 9022 }, { "epoch": 0.27, "learning_rate": 4.271686458484514e-06, "loss": 1.0395, "step": 9023 }, { "epoch": 0.27, "learning_rate": 4.27151435579997e-06, "loss": 1.064, "step": 9024 }, { "epoch": 0.27, "learning_rate": 4.2713422362514625e-06, "loss": 1.1859, "step": 9025 }, { "epoch": 0.27, "learning_rate": 4.27117009984063e-06, "loss": 1.1697, "step": 9026 }, { "epoch": 0.27, "learning_rate": 4.270997946569112e-06, "loss": 1.2428, "step": 9027 }, { "epoch": 0.27, "learning_rate": 4.2708257764385455e-06, "loss": 1.1973, "step": 9028 }, { "epoch": 0.27, "learning_rate": 4.27065358945057e-06, "loss": 1.1345, "step": 9029 }, { "epoch": 0.27, "learning_rate": 4.270481385606827e-06, "loss": 1.1445, "step": 9030 }, { "epoch": 0.27, "learning_rate": 4.270309164908952e-06, "loss": 1.1616, "step": 9031 }, { "epoch": 0.27, "learning_rate": 4.270136927358588e-06, "loss": 1.1387, "step": 9032 }, { "epoch": 0.27, "learning_rate": 4.269964672957372e-06, "loss": 1.2211, "step": 9033 }, { "epoch": 0.27, "learning_rate": 4.269792401706945e-06, "loss": 1.0892, "step": 9034 }, { "epoch": 0.27, "learning_rate": 4.2696201136089466e-06, "loss": 1.0938, "step": 9035 }, { "epoch": 0.27, "learning_rate": 4.269447808665017e-06, "loss": 1.1801, "step": 9036 }, { "epoch": 0.27, "learning_rate": 4.269275486876796e-06, "loss": 1.0659, "step": 9037 }, { "epoch": 0.27, "learning_rate": 4.269103148245925e-06, "loss": 1.1445, "step": 9038 }, { "epoch": 0.27, "learning_rate": 4.268930792774044e-06, "loss": 1.0942, "step": 9039 }, { "epoch": 0.27, "learning_rate": 4.268758420462794e-06, "loss": 1.0779, "step": 9040 }, { "epoch": 0.27, "learning_rate": 4.2685860313138155e-06, "loss": 1.0579, "step": 9041 }, { "epoch": 0.27, "learning_rate": 4.26841362532875e-06, "loss": 1.0479, "step": 9042 }, { "epoch": 0.27, "learning_rate": 4.268241202509238e-06, "loss": 1.2421, "step": 9043 }, { "epoch": 0.27, "learning_rate": 4.268068762856922e-06, "loss": 1.1439, "step": 9044 }, { "epoch": 0.27, "learning_rate": 4.267896306373442e-06, "loss": 1.1202, "step": 9045 }, { "epoch": 0.27, "learning_rate": 4.267723833060441e-06, "loss": 1.1416, "step": 9046 }, { "epoch": 0.27, "learning_rate": 4.2675513429195605e-06, "loss": 1.2198, "step": 9047 }, { "epoch": 0.27, "learning_rate": 4.267378835952442e-06, "loss": 1.2384, "step": 9048 }, { "epoch": 0.27, "learning_rate": 4.26720631216073e-06, "loss": 1.119, "step": 9049 }, { "epoch": 0.27, "learning_rate": 4.267033771546063e-06, "loss": 1.0582, "step": 9050 }, { "epoch": 0.27, "learning_rate": 4.266861214110086e-06, "loss": 1.2094, "step": 9051 }, { "epoch": 0.27, "learning_rate": 4.266688639854442e-06, "loss": 1.2684, "step": 9052 }, { "epoch": 0.27, "learning_rate": 4.2665160487807724e-06, "loss": 1.2584, "step": 9053 }, { "epoch": 0.27, "learning_rate": 4.266343440890721e-06, "loss": 1.0854, "step": 9054 }, { "epoch": 0.27, "learning_rate": 4.2661708161859304e-06, "loss": 1.2458, "step": 9055 }, { "epoch": 0.27, "learning_rate": 4.265998174668045e-06, "loss": 1.0647, "step": 9056 }, { "epoch": 0.27, "learning_rate": 4.265825516338707e-06, "loss": 1.1754, "step": 9057 }, { "epoch": 0.27, "learning_rate": 4.265652841199561e-06, "loss": 1.1512, "step": 9058 }, { "epoch": 0.27, "learning_rate": 4.265480149252249e-06, "loss": 1.1954, "step": 9059 }, { "epoch": 0.27, "learning_rate": 4.265307440498418e-06, "loss": 1.1539, "step": 9060 }, { "epoch": 0.27, "learning_rate": 4.265134714939709e-06, "loss": 1.2629, "step": 9061 }, { "epoch": 0.27, "learning_rate": 4.264961972577768e-06, "loss": 1.2589, "step": 9062 }, { "epoch": 0.27, "learning_rate": 4.26478921341424e-06, "loss": 1.1626, "step": 9063 }, { "epoch": 0.27, "learning_rate": 4.264616437450767e-06, "loss": 1.0897, "step": 9064 }, { "epoch": 0.27, "learning_rate": 4.264443644688997e-06, "loss": 1.04, "step": 9065 }, { "epoch": 0.27, "learning_rate": 4.264270835130572e-06, "loss": 1.3087, "step": 9066 }, { "epoch": 0.27, "learning_rate": 4.264098008777139e-06, "loss": 1.1443, "step": 9067 }, { "epoch": 0.27, "learning_rate": 4.263925165630343e-06, "loss": 1.0821, "step": 9068 }, { "epoch": 0.27, "learning_rate": 4.2637523056918275e-06, "loss": 1.3202, "step": 9069 }, { "epoch": 0.27, "learning_rate": 4.26357942896324e-06, "loss": 1.1521, "step": 9070 }, { "epoch": 0.27, "learning_rate": 4.2634065354462265e-06, "loss": 1.1404, "step": 9071 }, { "epoch": 0.27, "learning_rate": 4.263233625142432e-06, "loss": 1.0673, "step": 9072 }, { "epoch": 0.27, "learning_rate": 4.263060698053503e-06, "loss": 1.0665, "step": 9073 }, { "epoch": 0.27, "learning_rate": 4.2628877541810835e-06, "loss": 1.1838, "step": 9074 }, { "epoch": 0.27, "learning_rate": 4.262714793526823e-06, "loss": 1.1625, "step": 9075 }, { "epoch": 0.27, "learning_rate": 4.262541816092366e-06, "loss": 1.2363, "step": 9076 }, { "epoch": 0.27, "learning_rate": 4.26236882187936e-06, "loss": 1.1642, "step": 9077 }, { "epoch": 0.27, "learning_rate": 4.262195810889452e-06, "loss": 1.0432, "step": 9078 }, { "epoch": 0.27, "learning_rate": 4.262022783124288e-06, "loss": 1.2277, "step": 9079 }, { "epoch": 0.27, "learning_rate": 4.261849738585516e-06, "loss": 1.2099, "step": 9080 }, { "epoch": 0.27, "learning_rate": 4.261676677274783e-06, "loss": 1.1777, "step": 9081 }, { "epoch": 0.27, "learning_rate": 4.261503599193737e-06, "loss": 1.1218, "step": 9082 }, { "epoch": 0.27, "learning_rate": 4.261330504344024e-06, "loss": 1.0921, "step": 9083 }, { "epoch": 0.27, "learning_rate": 4.261157392727293e-06, "loss": 1.1009, "step": 9084 }, { "epoch": 0.27, "learning_rate": 4.260984264345192e-06, "loss": 1.0857, "step": 9085 }, { "epoch": 0.27, "learning_rate": 4.26081111919937e-06, "loss": 1.2063, "step": 9086 }, { "epoch": 0.27, "learning_rate": 4.260637957291473e-06, "loss": 1.1998, "step": 9087 }, { "epoch": 0.27, "learning_rate": 4.260464778623151e-06, "loss": 1.1154, "step": 9088 }, { "epoch": 0.27, "learning_rate": 4.260291583196052e-06, "loss": 1.0812, "step": 9089 }, { "epoch": 0.27, "learning_rate": 4.260118371011825e-06, "loss": 1.1352, "step": 9090 }, { "epoch": 0.27, "learning_rate": 4.259945142072119e-06, "loss": 1.0485, "step": 9091 }, { "epoch": 0.27, "learning_rate": 4.259771896378583e-06, "loss": 1.2093, "step": 9092 }, { "epoch": 0.27, "learning_rate": 4.259598633932866e-06, "loss": 1.2193, "step": 9093 }, { "epoch": 0.27, "learning_rate": 4.259425354736617e-06, "loss": 1.1121, "step": 9094 }, { "epoch": 0.27, "learning_rate": 4.259252058791487e-06, "loss": 1.0425, "step": 9095 }, { "epoch": 0.27, "learning_rate": 4.259078746099123e-06, "loss": 1.1191, "step": 9096 }, { "epoch": 0.27, "learning_rate": 4.258905416661178e-06, "loss": 1.0747, "step": 9097 }, { "epoch": 0.27, "learning_rate": 4.2587320704793004e-06, "loss": 1.1581, "step": 9098 }, { "epoch": 0.27, "learning_rate": 4.258558707555141e-06, "loss": 1.1127, "step": 9099 }, { "epoch": 0.27, "learning_rate": 4.258385327890347e-06, "loss": 1.1089, "step": 9100 }, { "epoch": 0.27, "learning_rate": 4.258211931486574e-06, "loss": 1.0906, "step": 9101 }, { "epoch": 0.27, "learning_rate": 4.25803851834547e-06, "loss": 1.1379, "step": 9102 }, { "epoch": 0.27, "learning_rate": 4.257865088468685e-06, "loss": 1.1351, "step": 9103 }, { "epoch": 0.27, "learning_rate": 4.257691641857872e-06, "loss": 1.3016, "step": 9104 }, { "epoch": 0.27, "learning_rate": 4.25751817851468e-06, "loss": 1.132, "step": 9105 }, { "epoch": 0.27, "learning_rate": 4.257344698440763e-06, "loss": 1.3187, "step": 9106 }, { "epoch": 0.27, "learning_rate": 4.257171201637769e-06, "loss": 1.1719, "step": 9107 }, { "epoch": 0.27, "learning_rate": 4.256997688107353e-06, "loss": 1.0947, "step": 9108 }, { "epoch": 0.27, "learning_rate": 4.256824157851165e-06, "loss": 1.16, "step": 9109 }, { "epoch": 0.27, "learning_rate": 4.256650610870856e-06, "loss": 1.1783, "step": 9110 }, { "epoch": 0.27, "learning_rate": 4.25647704716808e-06, "loss": 1.1891, "step": 9111 }, { "epoch": 0.27, "learning_rate": 4.256303466744488e-06, "loss": 1.1434, "step": 9112 }, { "epoch": 0.27, "learning_rate": 4.2561298696017335e-06, "loss": 1.0225, "step": 9113 }, { "epoch": 0.27, "learning_rate": 4.255956255741468e-06, "loss": 1.1446, "step": 9114 }, { "epoch": 0.27, "learning_rate": 4.255782625165344e-06, "loss": 1.0974, "step": 9115 }, { "epoch": 0.27, "learning_rate": 4.255608977875017e-06, "loss": 1.1227, "step": 9116 }, { "epoch": 0.27, "learning_rate": 4.255435313872137e-06, "loss": 1.1554, "step": 9117 }, { "epoch": 0.27, "learning_rate": 4.255261633158358e-06, "loss": 1.2535, "step": 9118 }, { "epoch": 0.27, "learning_rate": 4.255087935735334e-06, "loss": 1.1719, "step": 9119 }, { "epoch": 0.27, "learning_rate": 4.254914221604717e-06, "loss": 1.1747, "step": 9120 }, { "epoch": 0.27, "learning_rate": 4.254740490768163e-06, "loss": 1.1855, "step": 9121 }, { "epoch": 0.27, "learning_rate": 4.254566743227324e-06, "loss": 1.1934, "step": 9122 }, { "epoch": 0.27, "learning_rate": 4.254392978983856e-06, "loss": 1.1425, "step": 9123 }, { "epoch": 0.27, "learning_rate": 4.25421919803941e-06, "loss": 1.1441, "step": 9124 }, { "epoch": 0.27, "learning_rate": 4.254045400395643e-06, "loss": 1.2937, "step": 9125 }, { "epoch": 0.27, "learning_rate": 4.253871586054208e-06, "loss": 1.1622, "step": 9126 }, { "epoch": 0.27, "learning_rate": 4.253697755016761e-06, "loss": 1.0698, "step": 9127 }, { "epoch": 0.27, "learning_rate": 4.253523907284955e-06, "loss": 1.1245, "step": 9128 }, { "epoch": 0.28, "learning_rate": 4.253350042860447e-06, "loss": 1.1266, "step": 9129 }, { "epoch": 0.28, "learning_rate": 4.2531761617448905e-06, "loss": 1.1508, "step": 9130 }, { "epoch": 0.28, "learning_rate": 4.253002263939941e-06, "loss": 1.0375, "step": 9131 }, { "epoch": 0.28, "learning_rate": 4.252828349447254e-06, "loss": 1.0809, "step": 9132 }, { "epoch": 0.28, "learning_rate": 4.252654418268486e-06, "loss": 1.1693, "step": 9133 }, { "epoch": 0.28, "learning_rate": 4.252480470405293e-06, "loss": 1.1314, "step": 9134 }, { "epoch": 0.28, "learning_rate": 4.252306505859329e-06, "loss": 1.1212, "step": 9135 }, { "epoch": 0.28, "learning_rate": 4.25213252463225e-06, "loss": 1.1931, "step": 9136 }, { "epoch": 0.28, "learning_rate": 4.251958526725714e-06, "loss": 1.2158, "step": 9137 }, { "epoch": 0.28, "learning_rate": 4.251784512141377e-06, "loss": 1.0739, "step": 9138 }, { "epoch": 0.28, "learning_rate": 4.251610480880895e-06, "loss": 1.0658, "step": 9139 }, { "epoch": 0.28, "learning_rate": 4.2514364329459246e-06, "loss": 1.2128, "step": 9140 }, { "epoch": 0.28, "learning_rate": 4.251262368338123e-06, "loss": 1.1531, "step": 9141 }, { "epoch": 0.28, "learning_rate": 4.251088287059146e-06, "loss": 1.1635, "step": 9142 }, { "epoch": 0.28, "learning_rate": 4.250914189110653e-06, "loss": 1.1857, "step": 9143 }, { "epoch": 0.28, "learning_rate": 4.250740074494301e-06, "loss": 1.121, "step": 9144 }, { "epoch": 0.28, "learning_rate": 4.250565943211745e-06, "loss": 1.1317, "step": 9145 }, { "epoch": 0.28, "learning_rate": 4.250391795264645e-06, "loss": 1.1208, "step": 9146 }, { "epoch": 0.28, "learning_rate": 4.250217630654658e-06, "loss": 1.0257, "step": 9147 }, { "epoch": 0.28, "learning_rate": 4.250043449383443e-06, "loss": 1.204, "step": 9148 }, { "epoch": 0.28, "learning_rate": 4.249869251452656e-06, "loss": 1.0646, "step": 9149 }, { "epoch": 0.28, "learning_rate": 4.249695036863957e-06, "loss": 1.13, "step": 9150 }, { "epoch": 0.28, "learning_rate": 4.249520805619004e-06, "loss": 1.173, "step": 9151 }, { "epoch": 0.28, "learning_rate": 4.249346557719456e-06, "loss": 1.1979, "step": 9152 }, { "epoch": 0.28, "learning_rate": 4.24917229316697e-06, "loss": 1.0582, "step": 9153 }, { "epoch": 0.28, "learning_rate": 4.248998011963207e-06, "loss": 1.1412, "step": 9154 }, { "epoch": 0.28, "learning_rate": 4.248823714109826e-06, "loss": 1.2095, "step": 9155 }, { "epoch": 0.28, "learning_rate": 4.2486493996084835e-06, "loss": 1.187, "step": 9156 }, { "epoch": 0.28, "learning_rate": 4.2484750684608425e-06, "loss": 1.1734, "step": 9157 }, { "epoch": 0.28, "learning_rate": 4.24830072066856e-06, "loss": 1.226, "step": 9158 }, { "epoch": 0.28, "learning_rate": 4.248126356233298e-06, "loss": 1.082, "step": 9159 }, { "epoch": 0.28, "learning_rate": 4.247951975156714e-06, "loss": 1.2894, "step": 9160 }, { "epoch": 0.28, "learning_rate": 4.247777577440469e-06, "loss": 1.1021, "step": 9161 }, { "epoch": 0.28, "learning_rate": 4.247603163086223e-06, "loss": 1.3279, "step": 9162 }, { "epoch": 0.28, "learning_rate": 4.2474287320956375e-06, "loss": 1.0712, "step": 9163 }, { "epoch": 0.28, "learning_rate": 4.2472542844703715e-06, "loss": 1.1142, "step": 9164 }, { "epoch": 0.28, "learning_rate": 4.2470798202120865e-06, "loss": 1.1107, "step": 9165 }, { "epoch": 0.28, "learning_rate": 4.2469053393224425e-06, "loss": 1.1257, "step": 9166 }, { "epoch": 0.28, "learning_rate": 4.2467308418031015e-06, "loss": 1.2107, "step": 9167 }, { "epoch": 0.28, "learning_rate": 4.246556327655724e-06, "loss": 1.2349, "step": 9168 }, { "epoch": 0.28, "learning_rate": 4.246381796881971e-06, "loss": 1.1436, "step": 9169 }, { "epoch": 0.28, "learning_rate": 4.246207249483505e-06, "loss": 1.1736, "step": 9170 }, { "epoch": 0.28, "learning_rate": 4.246032685461987e-06, "loss": 1.1826, "step": 9171 }, { "epoch": 0.28, "learning_rate": 4.245858104819078e-06, "loss": 1.2527, "step": 9172 }, { "epoch": 0.28, "learning_rate": 4.245683507556442e-06, "loss": 1.2059, "step": 9173 }, { "epoch": 0.28, "learning_rate": 4.2455088936757386e-06, "loss": 1.2365, "step": 9174 }, { "epoch": 0.28, "learning_rate": 4.245334263178632e-06, "loss": 1.0474, "step": 9175 }, { "epoch": 0.28, "learning_rate": 4.245159616066783e-06, "loss": 1.1465, "step": 9176 }, { "epoch": 0.28, "learning_rate": 4.244984952341855e-06, "loss": 1.1327, "step": 9177 }, { "epoch": 0.28, "learning_rate": 4.24481027200551e-06, "loss": 1.1014, "step": 9178 }, { "epoch": 0.28, "learning_rate": 4.244635575059413e-06, "loss": 1.239, "step": 9179 }, { "epoch": 0.28, "learning_rate": 4.2444608615052255e-06, "loss": 1.124, "step": 9180 }, { "epoch": 0.28, "learning_rate": 4.24428613134461e-06, "loss": 1.1716, "step": 9181 }, { "epoch": 0.28, "learning_rate": 4.244111384579231e-06, "loss": 1.0927, "step": 9182 }, { "epoch": 0.28, "learning_rate": 4.243936621210751e-06, "loss": 1.2324, "step": 9183 }, { "epoch": 0.28, "learning_rate": 4.243761841240835e-06, "loss": 1.2161, "step": 9184 }, { "epoch": 0.28, "learning_rate": 4.243587044671147e-06, "loss": 1.1884, "step": 9185 }, { "epoch": 0.28, "learning_rate": 4.243412231503348e-06, "loss": 1.2113, "step": 9186 }, { "epoch": 0.28, "learning_rate": 4.243237401739106e-06, "loss": 1.2427, "step": 9187 }, { "epoch": 0.28, "learning_rate": 4.243062555380082e-06, "loss": 1.0549, "step": 9188 }, { "epoch": 0.28, "learning_rate": 4.2428876924279425e-06, "loss": 1.0718, "step": 9189 }, { "epoch": 0.28, "learning_rate": 4.242712812884353e-06, "loss": 1.0838, "step": 9190 }, { "epoch": 0.28, "learning_rate": 4.242537916750975e-06, "loss": 1.1429, "step": 9191 }, { "epoch": 0.28, "learning_rate": 4.242363004029476e-06, "loss": 1.1209, "step": 9192 }, { "epoch": 0.28, "learning_rate": 4.242188074721521e-06, "loss": 1.2086, "step": 9193 }, { "epoch": 0.28, "learning_rate": 4.242013128828773e-06, "loss": 1.1818, "step": 9194 }, { "epoch": 0.28, "learning_rate": 4.2418381663529e-06, "loss": 1.1882, "step": 9195 }, { "epoch": 0.28, "learning_rate": 4.241663187295566e-06, "loss": 1.1119, "step": 9196 }, { "epoch": 0.28, "learning_rate": 4.241488191658438e-06, "loss": 1.2108, "step": 9197 }, { "epoch": 0.28, "learning_rate": 4.24131317944318e-06, "loss": 1.1526, "step": 9198 }, { "epoch": 0.28, "learning_rate": 4.24113815065146e-06, "loss": 1.0762, "step": 9199 }, { "epoch": 0.28, "learning_rate": 4.240963105284944e-06, "loss": 1.1628, "step": 9200 }, { "epoch": 0.28, "learning_rate": 4.240788043345297e-06, "loss": 1.1305, "step": 9201 }, { "epoch": 0.28, "learning_rate": 4.240612964834186e-06, "loss": 1.1107, "step": 9202 }, { "epoch": 0.28, "learning_rate": 4.240437869753278e-06, "loss": 1.1479, "step": 9203 }, { "epoch": 0.28, "learning_rate": 4.24026275810424e-06, "loss": 1.1901, "step": 9204 }, { "epoch": 0.28, "learning_rate": 4.2400876298887385e-06, "loss": 1.2133, "step": 9205 }, { "epoch": 0.28, "learning_rate": 4.239912485108441e-06, "loss": 1.2867, "step": 9206 }, { "epoch": 0.28, "learning_rate": 4.239737323765014e-06, "loss": 1.1246, "step": 9207 }, { "epoch": 0.28, "learning_rate": 4.239562145860127e-06, "loss": 1.1573, "step": 9208 }, { "epoch": 0.28, "learning_rate": 4.239386951395444e-06, "loss": 1.0364, "step": 9209 }, { "epoch": 0.28, "learning_rate": 4.239211740372637e-06, "loss": 1.1082, "step": 9210 }, { "epoch": 0.28, "learning_rate": 4.239036512793371e-06, "loss": 1.1174, "step": 9211 }, { "epoch": 0.28, "learning_rate": 4.238861268659314e-06, "loss": 1.1163, "step": 9212 }, { "epoch": 0.28, "learning_rate": 4.238686007972137e-06, "loss": 1.0699, "step": 9213 }, { "epoch": 0.28, "learning_rate": 4.238510730733506e-06, "loss": 1.121, "step": 9214 }, { "epoch": 0.28, "learning_rate": 4.238335436945089e-06, "loss": 1.0043, "step": 9215 }, { "epoch": 0.28, "learning_rate": 4.238160126608557e-06, "loss": 1.1876, "step": 9216 }, { "epoch": 0.28, "learning_rate": 4.237984799725577e-06, "loss": 1.1567, "step": 9217 }, { "epoch": 0.28, "learning_rate": 4.23780945629782e-06, "loss": 1.2299, "step": 9218 }, { "epoch": 0.28, "learning_rate": 4.237634096326952e-06, "loss": 1.0941, "step": 9219 }, { "epoch": 0.28, "learning_rate": 4.237458719814646e-06, "loss": 1.111, "step": 9220 }, { "epoch": 0.28, "learning_rate": 4.237283326762569e-06, "loss": 1.116, "step": 9221 }, { "epoch": 0.28, "learning_rate": 4.237107917172392e-06, "loss": 1.0543, "step": 9222 }, { "epoch": 0.28, "learning_rate": 4.236932491045784e-06, "loss": 1.1297, "step": 9223 }, { "epoch": 0.28, "learning_rate": 4.236757048384415e-06, "loss": 1.134, "step": 9224 }, { "epoch": 0.28, "learning_rate": 4.236581589189955e-06, "loss": 1.0781, "step": 9225 }, { "epoch": 0.28, "learning_rate": 4.236406113464075e-06, "loss": 1.1074, "step": 9226 }, { "epoch": 0.28, "learning_rate": 4.236230621208446e-06, "loss": 1.0931, "step": 9227 }, { "epoch": 0.28, "learning_rate": 4.236055112424736e-06, "loss": 1.1113, "step": 9228 }, { "epoch": 0.28, "learning_rate": 4.235879587114619e-06, "loss": 1.2054, "step": 9229 }, { "epoch": 0.28, "learning_rate": 4.235704045279762e-06, "loss": 1.1447, "step": 9230 }, { "epoch": 0.28, "learning_rate": 4.235528486921842e-06, "loss": 1.082, "step": 9231 }, { "epoch": 0.28, "learning_rate": 4.235352912042524e-06, "loss": 1.0418, "step": 9232 }, { "epoch": 0.28, "learning_rate": 4.235177320643483e-06, "loss": 1.1235, "step": 9233 }, { "epoch": 0.28, "learning_rate": 4.235001712726389e-06, "loss": 1.0194, "step": 9234 }, { "epoch": 0.28, "learning_rate": 4.2348260882929144e-06, "loss": 1.2351, "step": 9235 }, { "epoch": 0.28, "learning_rate": 4.234650447344731e-06, "loss": 1.2191, "step": 9236 }, { "epoch": 0.28, "learning_rate": 4.234474789883511e-06, "loss": 1.2135, "step": 9237 }, { "epoch": 0.28, "learning_rate": 4.234299115910927e-06, "loss": 1.0994, "step": 9238 }, { "epoch": 0.28, "learning_rate": 4.23412342542865e-06, "loss": 1.0598, "step": 9239 }, { "epoch": 0.28, "learning_rate": 4.233947718438353e-06, "loss": 1.0932, "step": 9240 }, { "epoch": 0.28, "learning_rate": 4.233771994941709e-06, "loss": 1.064, "step": 9241 }, { "epoch": 0.28, "learning_rate": 4.233596254940391e-06, "loss": 1.1763, "step": 9242 }, { "epoch": 0.28, "learning_rate": 4.233420498436071e-06, "loss": 0.9941, "step": 9243 }, { "epoch": 0.28, "learning_rate": 4.233244725430423e-06, "loss": 1.0939, "step": 9244 }, { "epoch": 0.28, "learning_rate": 4.23306893592512e-06, "loss": 1.2003, "step": 9245 }, { "epoch": 0.28, "learning_rate": 4.232893129921835e-06, "loss": 1.1528, "step": 9246 }, { "epoch": 0.28, "learning_rate": 4.232717307422243e-06, "loss": 1.1725, "step": 9247 }, { "epoch": 0.28, "learning_rate": 4.232541468428016e-06, "loss": 1.0854, "step": 9248 }, { "epoch": 0.28, "learning_rate": 4.232365612940828e-06, "loss": 1.0851, "step": 9249 }, { "epoch": 0.28, "learning_rate": 4.232189740962354e-06, "loss": 1.1356, "step": 9250 }, { "epoch": 0.28, "learning_rate": 4.232013852494269e-06, "loss": 1.1495, "step": 9251 }, { "epoch": 0.28, "learning_rate": 4.231837947538246e-06, "loss": 1.1627, "step": 9252 }, { "epoch": 0.28, "learning_rate": 4.231662026095958e-06, "loss": 1.2831, "step": 9253 }, { "epoch": 0.28, "learning_rate": 4.2314860881690834e-06, "loss": 1.0365, "step": 9254 }, { "epoch": 0.28, "learning_rate": 4.231310133759295e-06, "loss": 1.231, "step": 9255 }, { "epoch": 0.28, "learning_rate": 4.231134162868267e-06, "loss": 1.1218, "step": 9256 }, { "epoch": 0.28, "learning_rate": 4.230958175497677e-06, "loss": 1.1967, "step": 9257 }, { "epoch": 0.28, "learning_rate": 4.230782171649197e-06, "loss": 1.032, "step": 9258 }, { "epoch": 0.28, "learning_rate": 4.2306061513245065e-06, "loss": 1.1338, "step": 9259 }, { "epoch": 0.28, "learning_rate": 4.230430114525277e-06, "loss": 1.0325, "step": 9260 }, { "epoch": 0.28, "learning_rate": 4.2302540612531876e-06, "loss": 1.2405, "step": 9261 }, { "epoch": 0.28, "learning_rate": 4.230077991509911e-06, "loss": 1.1255, "step": 9262 }, { "epoch": 0.28, "learning_rate": 4.229901905297127e-06, "loss": 1.1481, "step": 9263 }, { "epoch": 0.28, "learning_rate": 4.229725802616509e-06, "loss": 1.1282, "step": 9264 }, { "epoch": 0.28, "learning_rate": 4.229549683469735e-06, "loss": 1.1775, "step": 9265 }, { "epoch": 0.28, "learning_rate": 4.229373547858481e-06, "loss": 1.2146, "step": 9266 }, { "epoch": 0.28, "learning_rate": 4.229197395784424e-06, "loss": 1.1249, "step": 9267 }, { "epoch": 0.28, "learning_rate": 4.229021227249239e-06, "loss": 1.2414, "step": 9268 }, { "epoch": 0.28, "learning_rate": 4.228845042254606e-06, "loss": 1.1911, "step": 9269 }, { "epoch": 0.28, "learning_rate": 4.228668840802201e-06, "loss": 1.2068, "step": 9270 }, { "epoch": 0.28, "learning_rate": 4.2284926228937e-06, "loss": 1.0913, "step": 9271 }, { "epoch": 0.28, "learning_rate": 4.228316388530783e-06, "loss": 1.1805, "step": 9272 }, { "epoch": 0.28, "learning_rate": 4.228140137715126e-06, "loss": 1.0383, "step": 9273 }, { "epoch": 0.28, "learning_rate": 4.227963870448406e-06, "loss": 1.0829, "step": 9274 }, { "epoch": 0.28, "learning_rate": 4.227787586732304e-06, "loss": 1.1855, "step": 9275 }, { "epoch": 0.28, "learning_rate": 4.227611286568495e-06, "loss": 1.1298, "step": 9276 }, { "epoch": 0.28, "learning_rate": 4.227434969958659e-06, "loss": 1.0814, "step": 9277 }, { "epoch": 0.28, "learning_rate": 4.227258636904474e-06, "loss": 1.113, "step": 9278 }, { "epoch": 0.28, "learning_rate": 4.227082287407619e-06, "loss": 1.2649, "step": 9279 }, { "epoch": 0.28, "learning_rate": 4.226905921469772e-06, "loss": 1.1146, "step": 9280 }, { "epoch": 0.28, "learning_rate": 4.226729539092613e-06, "loss": 1.1687, "step": 9281 }, { "epoch": 0.28, "learning_rate": 4.226553140277819e-06, "loss": 1.0172, "step": 9282 }, { "epoch": 0.28, "learning_rate": 4.226376725027072e-06, "loss": 1.1956, "step": 9283 }, { "epoch": 0.28, "learning_rate": 4.22620029334205e-06, "loss": 1.1105, "step": 9284 }, { "epoch": 0.28, "learning_rate": 4.226023845224431e-06, "loss": 1.1999, "step": 9285 }, { "epoch": 0.28, "learning_rate": 4.225847380675898e-06, "loss": 1.1483, "step": 9286 }, { "epoch": 0.28, "learning_rate": 4.225670899698128e-06, "loss": 1.2228, "step": 9287 }, { "epoch": 0.28, "learning_rate": 4.2254944022928035e-06, "loss": 1.1511, "step": 9288 }, { "epoch": 0.28, "learning_rate": 4.225317888461602e-06, "loss": 1.2206, "step": 9289 }, { "epoch": 0.28, "learning_rate": 4.225141358206206e-06, "loss": 1.1255, "step": 9290 }, { "epoch": 0.28, "learning_rate": 4.224964811528295e-06, "loss": 1.1154, "step": 9291 }, { "epoch": 0.28, "learning_rate": 4.22478824842955e-06, "loss": 1.0958, "step": 9292 }, { "epoch": 0.28, "learning_rate": 4.22461166891165e-06, "loss": 1.1422, "step": 9293 }, { "epoch": 0.28, "learning_rate": 4.22443507297628e-06, "loss": 1.0963, "step": 9294 }, { "epoch": 0.28, "learning_rate": 4.224258460625117e-06, "loss": 1.3002, "step": 9295 }, { "epoch": 0.28, "learning_rate": 4.224081831859844e-06, "loss": 1.0966, "step": 9296 }, { "epoch": 0.28, "learning_rate": 4.223905186682142e-06, "loss": 1.1785, "step": 9297 }, { "epoch": 0.28, "learning_rate": 4.223728525093694e-06, "loss": 1.1704, "step": 9298 }, { "epoch": 0.28, "learning_rate": 4.22355184709618e-06, "loss": 1.131, "step": 9299 }, { "epoch": 0.28, "learning_rate": 4.223375152691283e-06, "loss": 1.178, "step": 9300 }, { "epoch": 0.28, "learning_rate": 4.223198441880683e-06, "loss": 1.078, "step": 9301 }, { "epoch": 0.28, "learning_rate": 4.223021714666064e-06, "loss": 1.1912, "step": 9302 }, { "epoch": 0.28, "learning_rate": 4.2228449710491095e-06, "loss": 1.0383, "step": 9303 }, { "epoch": 0.28, "learning_rate": 4.2226682110315e-06, "loss": 1.1554, "step": 9304 }, { "epoch": 0.28, "learning_rate": 4.2224914346149195e-06, "loss": 1.2576, "step": 9305 }, { "epoch": 0.28, "learning_rate": 4.2223146418010495e-06, "loss": 1.1466, "step": 9306 }, { "epoch": 0.28, "learning_rate": 4.222137832591573e-06, "loss": 1.0541, "step": 9307 }, { "epoch": 0.28, "learning_rate": 4.221961006988175e-06, "loss": 1.1116, "step": 9308 }, { "epoch": 0.28, "learning_rate": 4.221784164992536e-06, "loss": 0.9911, "step": 9309 }, { "epoch": 0.28, "learning_rate": 4.221607306606342e-06, "loss": 1.0479, "step": 9310 }, { "epoch": 0.28, "learning_rate": 4.221430431831276e-06, "loss": 1.2207, "step": 9311 }, { "epoch": 0.28, "learning_rate": 4.221253540669021e-06, "loss": 1.1879, "step": 9312 }, { "epoch": 0.28, "learning_rate": 4.221076633121261e-06, "loss": 1.1925, "step": 9313 }, { "epoch": 0.28, "learning_rate": 4.22089970918968e-06, "loss": 1.1411, "step": 9314 }, { "epoch": 0.28, "learning_rate": 4.220722768875962e-06, "loss": 0.9876, "step": 9315 }, { "epoch": 0.28, "learning_rate": 4.220545812181794e-06, "loss": 1.1955, "step": 9316 }, { "epoch": 0.28, "learning_rate": 4.220368839108857e-06, "loss": 1.1343, "step": 9317 }, { "epoch": 0.28, "learning_rate": 4.220191849658838e-06, "loss": 1.2232, "step": 9318 }, { "epoch": 0.28, "learning_rate": 4.22001484383342e-06, "loss": 1.1001, "step": 9319 }, { "epoch": 0.28, "learning_rate": 4.21983782163429e-06, "loss": 1.0305, "step": 9320 }, { "epoch": 0.28, "learning_rate": 4.219660783063132e-06, "loss": 1.1042, "step": 9321 }, { "epoch": 0.28, "learning_rate": 4.2194837281216325e-06, "loss": 1.0952, "step": 9322 }, { "epoch": 0.28, "learning_rate": 4.2193066568114745e-06, "loss": 1.1996, "step": 9323 }, { "epoch": 0.28, "learning_rate": 4.219129569134346e-06, "loss": 1.1866, "step": 9324 }, { "epoch": 0.28, "learning_rate": 4.2189524650919315e-06, "loss": 1.1452, "step": 9325 }, { "epoch": 0.28, "learning_rate": 4.2187753446859185e-06, "loss": 1.1379, "step": 9326 }, { "epoch": 0.28, "learning_rate": 4.218598207917991e-06, "loss": 1.2549, "step": 9327 }, { "epoch": 0.28, "learning_rate": 4.218421054789837e-06, "loss": 1.1848, "step": 9328 }, { "epoch": 0.28, "learning_rate": 4.218243885303141e-06, "loss": 1.172, "step": 9329 }, { "epoch": 0.28, "learning_rate": 4.218066699459591e-06, "loss": 1.3326, "step": 9330 }, { "epoch": 0.28, "learning_rate": 4.2178894972608745e-06, "loss": 1.2382, "step": 9331 }, { "epoch": 0.28, "learning_rate": 4.217712278708676e-06, "loss": 1.1544, "step": 9332 }, { "epoch": 0.28, "learning_rate": 4.217535043804685e-06, "loss": 1.1927, "step": 9333 }, { "epoch": 0.28, "learning_rate": 4.217357792550587e-06, "loss": 1.0485, "step": 9334 }, { "epoch": 0.28, "learning_rate": 4.2171805249480705e-06, "loss": 1.0505, "step": 9335 }, { "epoch": 0.28, "learning_rate": 4.217003240998822e-06, "loss": 1.162, "step": 9336 }, { "epoch": 0.28, "learning_rate": 4.2168259407045295e-06, "loss": 1.2578, "step": 9337 }, { "epoch": 0.28, "learning_rate": 4.216648624066881e-06, "loss": 1.1629, "step": 9338 }, { "epoch": 0.28, "learning_rate": 4.216471291087564e-06, "loss": 1.0748, "step": 9339 }, { "epoch": 0.28, "learning_rate": 4.216293941768267e-06, "loss": 1.1076, "step": 9340 }, { "epoch": 0.28, "learning_rate": 4.216116576110679e-06, "loss": 1.1149, "step": 9341 }, { "epoch": 0.28, "learning_rate": 4.215939194116488e-06, "loss": 1.0906, "step": 9342 }, { "epoch": 0.28, "learning_rate": 4.215761795787381e-06, "loss": 1.129, "step": 9343 }, { "epoch": 0.28, "learning_rate": 4.215584381125048e-06, "loss": 1.1742, "step": 9344 }, { "epoch": 0.28, "learning_rate": 4.215406950131179e-06, "loss": 1.1781, "step": 9345 }, { "epoch": 0.28, "learning_rate": 4.215229502807462e-06, "loss": 1.1214, "step": 9346 }, { "epoch": 0.28, "learning_rate": 4.215052039155586e-06, "loss": 1.2596, "step": 9347 }, { "epoch": 0.28, "learning_rate": 4.21487455917724e-06, "loss": 1.204, "step": 9348 }, { "epoch": 0.28, "learning_rate": 4.2146970628741145e-06, "loss": 1.1741, "step": 9349 }, { "epoch": 0.28, "learning_rate": 4.2145195502478995e-06, "loss": 1.0093, "step": 9350 }, { "epoch": 0.28, "learning_rate": 4.214342021300283e-06, "loss": 1.1036, "step": 9351 }, { "epoch": 0.28, "learning_rate": 4.214164476032957e-06, "loss": 1.2675, "step": 9352 }, { "epoch": 0.28, "learning_rate": 4.21398691444761e-06, "loss": 1.2101, "step": 9353 }, { "epoch": 0.28, "learning_rate": 4.213809336545933e-06, "loss": 1.1755, "step": 9354 }, { "epoch": 0.28, "learning_rate": 4.213631742329617e-06, "loss": 1.1916, "step": 9355 }, { "epoch": 0.28, "learning_rate": 4.213454131800352e-06, "loss": 1.1865, "step": 9356 }, { "epoch": 0.28, "learning_rate": 4.213276504959829e-06, "loss": 1.0928, "step": 9357 }, { "epoch": 0.28, "learning_rate": 4.213098861809739e-06, "loss": 1.1315, "step": 9358 }, { "epoch": 0.28, "learning_rate": 4.212921202351772e-06, "loss": 1.1472, "step": 9359 }, { "epoch": 0.28, "learning_rate": 4.212743526587621e-06, "loss": 1.1476, "step": 9360 }, { "epoch": 0.28, "learning_rate": 4.212565834518977e-06, "loss": 1.1639, "step": 9361 }, { "epoch": 0.28, "learning_rate": 4.2123881261475294e-06, "loss": 1.3049, "step": 9362 }, { "epoch": 0.28, "learning_rate": 4.212210401474973e-06, "loss": 1.113, "step": 9363 }, { "epoch": 0.28, "learning_rate": 4.212032660502997e-06, "loss": 1.1938, "step": 9364 }, { "epoch": 0.28, "learning_rate": 4.211854903233296e-06, "loss": 1.1043, "step": 9365 }, { "epoch": 0.28, "learning_rate": 4.2116771296675596e-06, "loss": 1.1241, "step": 9366 }, { "epoch": 0.28, "learning_rate": 4.211499339807482e-06, "loss": 1.1664, "step": 9367 }, { "epoch": 0.28, "learning_rate": 4.211321533654755e-06, "loss": 1.1418, "step": 9368 }, { "epoch": 0.28, "learning_rate": 4.2111437112110705e-06, "loss": 1.0926, "step": 9369 }, { "epoch": 0.28, "learning_rate": 4.210965872478122e-06, "loss": 1.0731, "step": 9370 }, { "epoch": 0.28, "learning_rate": 4.210788017457603e-06, "loss": 1.1329, "step": 9371 }, { "epoch": 0.28, "learning_rate": 4.2106101461512065e-06, "loss": 1.131, "step": 9372 }, { "epoch": 0.28, "learning_rate": 4.210432258560624e-06, "loss": 1.0995, "step": 9373 }, { "epoch": 0.28, "learning_rate": 4.210254354687551e-06, "loss": 1.1938, "step": 9374 }, { "epoch": 0.28, "learning_rate": 4.2100764345336795e-06, "loss": 1.0823, "step": 9375 }, { "epoch": 0.28, "learning_rate": 4.209898498100705e-06, "loss": 1.1559, "step": 9376 }, { "epoch": 0.28, "learning_rate": 4.20972054539032e-06, "loss": 1.0825, "step": 9377 }, { "epoch": 0.28, "learning_rate": 4.209542576404219e-06, "loss": 1.1638, "step": 9378 }, { "epoch": 0.28, "learning_rate": 4.209364591144095e-06, "loss": 1.2162, "step": 9379 }, { "epoch": 0.28, "learning_rate": 4.209186589611644e-06, "loss": 1.2809, "step": 9380 }, { "epoch": 0.28, "learning_rate": 4.2090085718085596e-06, "loss": 1.0204, "step": 9381 }, { "epoch": 0.28, "learning_rate": 4.208830537736537e-06, "loss": 1.2515, "step": 9382 }, { "epoch": 0.28, "learning_rate": 4.208652487397271e-06, "loss": 1.1735, "step": 9383 }, { "epoch": 0.28, "learning_rate": 4.208474420792456e-06, "loss": 1.1054, "step": 9384 }, { "epoch": 0.28, "learning_rate": 4.208296337923787e-06, "loss": 1.1937, "step": 9385 }, { "epoch": 0.28, "learning_rate": 4.208118238792959e-06, "loss": 1.1417, "step": 9386 }, { "epoch": 0.28, "learning_rate": 4.207940123401669e-06, "loss": 1.2353, "step": 9387 }, { "epoch": 0.28, "learning_rate": 4.207761991751612e-06, "loss": 1.1452, "step": 9388 }, { "epoch": 0.28, "learning_rate": 4.207583843844483e-06, "loss": 1.1753, "step": 9389 }, { "epoch": 0.28, "learning_rate": 4.207405679681977e-06, "loss": 1.0776, "step": 9390 }, { "epoch": 0.28, "learning_rate": 4.207227499265792e-06, "loss": 1.2309, "step": 9391 }, { "epoch": 0.28, "learning_rate": 4.207049302597624e-06, "loss": 1.1735, "step": 9392 }, { "epoch": 0.28, "learning_rate": 4.206871089679169e-06, "loss": 1.2926, "step": 9393 }, { "epoch": 0.28, "learning_rate": 4.206692860512122e-06, "loss": 1.1183, "step": 9394 }, { "epoch": 0.28, "learning_rate": 4.206514615098182e-06, "loss": 1.1786, "step": 9395 }, { "epoch": 0.28, "learning_rate": 4.206336353439044e-06, "loss": 1.0602, "step": 9396 }, { "epoch": 0.28, "learning_rate": 4.206158075536407e-06, "loss": 1.1582, "step": 9397 }, { "epoch": 0.28, "learning_rate": 4.205979781391965e-06, "loss": 1.1841, "step": 9398 }, { "epoch": 0.28, "learning_rate": 4.205801471007418e-06, "loss": 1.2051, "step": 9399 }, { "epoch": 0.28, "learning_rate": 4.205623144384463e-06, "loss": 1.0283, "step": 9400 }, { "epoch": 0.28, "learning_rate": 4.205444801524796e-06, "loss": 1.1307, "step": 9401 }, { "epoch": 0.28, "learning_rate": 4.205266442430117e-06, "loss": 1.145, "step": 9402 }, { "epoch": 0.28, "learning_rate": 4.205088067102122e-06, "loss": 1.0811, "step": 9403 }, { "epoch": 0.28, "learning_rate": 4.204909675542511e-06, "loss": 1.0684, "step": 9404 }, { "epoch": 0.28, "learning_rate": 4.20473126775298e-06, "loss": 1.1929, "step": 9405 }, { "epoch": 0.28, "learning_rate": 4.204552843735228e-06, "loss": 1.2535, "step": 9406 }, { "epoch": 0.28, "learning_rate": 4.204374403490954e-06, "loss": 1.0959, "step": 9407 }, { "epoch": 0.28, "learning_rate": 4.204195947021857e-06, "loss": 1.2095, "step": 9408 }, { "epoch": 0.28, "learning_rate": 4.204017474329635e-06, "loss": 1.043, "step": 9409 }, { "epoch": 0.28, "learning_rate": 4.203838985415988e-06, "loss": 1.2493, "step": 9410 }, { "epoch": 0.28, "learning_rate": 4.203660480282614e-06, "loss": 1.1151, "step": 9411 }, { "epoch": 0.28, "learning_rate": 4.203481958931212e-06, "loss": 1.1368, "step": 9412 }, { "epoch": 0.28, "learning_rate": 4.2033034213634835e-06, "loss": 1.3265, "step": 9413 }, { "epoch": 0.28, "learning_rate": 4.203124867581126e-06, "loss": 1.1797, "step": 9414 }, { "epoch": 0.28, "learning_rate": 4.202946297585841e-06, "loss": 1.0826, "step": 9415 }, { "epoch": 0.28, "learning_rate": 4.202767711379326e-06, "loss": 1.1241, "step": 9416 }, { "epoch": 0.28, "learning_rate": 4.202589108963283e-06, "loss": 1.2066, "step": 9417 }, { "epoch": 0.28, "learning_rate": 4.2024104903394115e-06, "loss": 1.1207, "step": 9418 }, { "epoch": 0.28, "learning_rate": 4.202231855509413e-06, "loss": 1.1179, "step": 9419 }, { "epoch": 0.28, "learning_rate": 4.202053204474986e-06, "loss": 1.1418, "step": 9420 }, { "epoch": 0.28, "learning_rate": 4.201874537237832e-06, "loss": 1.1542, "step": 9421 }, { "epoch": 0.28, "learning_rate": 4.201695853799653e-06, "loss": 1.1761, "step": 9422 }, { "epoch": 0.28, "learning_rate": 4.201517154162149e-06, "loss": 1.093, "step": 9423 }, { "epoch": 0.28, "learning_rate": 4.201338438327021e-06, "loss": 1.1858, "step": 9424 }, { "epoch": 0.28, "learning_rate": 4.20115970629597e-06, "loss": 1.1263, "step": 9425 }, { "epoch": 0.28, "learning_rate": 4.200980958070698e-06, "loss": 1.1528, "step": 9426 }, { "epoch": 0.28, "learning_rate": 4.200802193652906e-06, "loss": 1.0629, "step": 9427 }, { "epoch": 0.28, "learning_rate": 4.200623413044298e-06, "loss": 1.1146, "step": 9428 }, { "epoch": 0.28, "learning_rate": 4.200444616246573e-06, "loss": 1.1406, "step": 9429 }, { "epoch": 0.28, "learning_rate": 4.200265803261434e-06, "loss": 1.2198, "step": 9430 }, { "epoch": 0.28, "learning_rate": 4.200086974090584e-06, "loss": 1.0417, "step": 9431 }, { "epoch": 0.28, "learning_rate": 4.199908128735724e-06, "loss": 1.1625, "step": 9432 }, { "epoch": 0.28, "learning_rate": 4.199729267198558e-06, "loss": 1.1258, "step": 9433 }, { "epoch": 0.28, "learning_rate": 4.1995503894807885e-06, "loss": 1.0349, "step": 9434 }, { "epoch": 0.28, "learning_rate": 4.199371495584117e-06, "loss": 1.1698, "step": 9435 }, { "epoch": 0.28, "learning_rate": 4.199192585510248e-06, "loss": 1.1289, "step": 9436 }, { "epoch": 0.28, "learning_rate": 4.199013659260883e-06, "loss": 1.1688, "step": 9437 }, { "epoch": 0.28, "learning_rate": 4.198834716837726e-06, "loss": 1.1608, "step": 9438 }, { "epoch": 0.28, "learning_rate": 4.198655758242482e-06, "loss": 1.1514, "step": 9439 }, { "epoch": 0.28, "learning_rate": 4.198476783476852e-06, "loss": 1.1687, "step": 9440 }, { "epoch": 0.28, "learning_rate": 4.198297792542542e-06, "loss": 1.0858, "step": 9441 }, { "epoch": 0.28, "learning_rate": 4.1981187854412546e-06, "loss": 1.1406, "step": 9442 }, { "epoch": 0.28, "learning_rate": 4.197939762174694e-06, "loss": 1.0507, "step": 9443 }, { "epoch": 0.28, "learning_rate": 4.197760722744565e-06, "loss": 1.0811, "step": 9444 }, { "epoch": 0.28, "learning_rate": 4.197581667152572e-06, "loss": 1.0782, "step": 9445 }, { "epoch": 0.28, "learning_rate": 4.197402595400418e-06, "loss": 1.1497, "step": 9446 }, { "epoch": 0.28, "learning_rate": 4.1972235074898096e-06, "loss": 1.1617, "step": 9447 }, { "epoch": 0.28, "learning_rate": 4.197044403422451e-06, "loss": 1.0606, "step": 9448 }, { "epoch": 0.28, "learning_rate": 4.196865283200045e-06, "loss": 1.2279, "step": 9449 }, { "epoch": 0.28, "learning_rate": 4.1966861468243015e-06, "loss": 1.0059, "step": 9450 }, { "epoch": 0.28, "learning_rate": 4.196506994296922e-06, "loss": 1.1204, "step": 9451 }, { "epoch": 0.28, "learning_rate": 4.196327825619613e-06, "loss": 1.1208, "step": 9452 }, { "epoch": 0.28, "learning_rate": 4.19614864079408e-06, "loss": 1.2125, "step": 9453 }, { "epoch": 0.28, "learning_rate": 4.1959694398220285e-06, "loss": 1.1949, "step": 9454 }, { "epoch": 0.28, "learning_rate": 4.195790222705165e-06, "loss": 1.1937, "step": 9455 }, { "epoch": 0.28, "learning_rate": 4.1956109894451955e-06, "loss": 1.1432, "step": 9456 }, { "epoch": 0.28, "learning_rate": 4.195431740043825e-06, "loss": 1.0774, "step": 9457 }, { "epoch": 0.28, "learning_rate": 4.195252474502762e-06, "loss": 1.2306, "step": 9458 }, { "epoch": 0.28, "learning_rate": 4.195073192823712e-06, "loss": 1.0118, "step": 9459 }, { "epoch": 0.28, "learning_rate": 4.19489389500838e-06, "loss": 1.1194, "step": 9460 }, { "epoch": 0.29, "learning_rate": 4.194714581058476e-06, "loss": 1.1392, "step": 9461 }, { "epoch": 0.29, "learning_rate": 4.194535250975706e-06, "loss": 1.0731, "step": 9462 }, { "epoch": 0.29, "learning_rate": 4.194355904761774e-06, "loss": 1.1678, "step": 9463 }, { "epoch": 0.29, "learning_rate": 4.194176542418392e-06, "loss": 1.1537, "step": 9464 }, { "epoch": 0.29, "learning_rate": 4.193997163947264e-06, "loss": 1.1704, "step": 9465 }, { "epoch": 0.29, "learning_rate": 4.1938177693501e-06, "loss": 1.2239, "step": 9466 }, { "epoch": 0.29, "learning_rate": 4.193638358628606e-06, "loss": 1.1154, "step": 9467 }, { "epoch": 0.29, "learning_rate": 4.1934589317844905e-06, "loss": 1.1178, "step": 9468 }, { "epoch": 0.29, "learning_rate": 4.1932794888194615e-06, "loss": 1.0642, "step": 9469 }, { "epoch": 0.29, "learning_rate": 4.193100029735228e-06, "loss": 1.1411, "step": 9470 }, { "epoch": 0.29, "learning_rate": 4.192920554533497e-06, "loss": 1.1266, "step": 9471 }, { "epoch": 0.29, "learning_rate": 4.192741063215977e-06, "loss": 1.1064, "step": 9472 }, { "epoch": 0.29, "learning_rate": 4.192561555784378e-06, "loss": 1.2555, "step": 9473 }, { "epoch": 0.29, "learning_rate": 4.192382032240408e-06, "loss": 1.1526, "step": 9474 }, { "epoch": 0.29, "learning_rate": 4.192202492585776e-06, "loss": 1.1285, "step": 9475 }, { "epoch": 0.29, "learning_rate": 4.192022936822192e-06, "loss": 1.1467, "step": 9476 }, { "epoch": 0.29, "learning_rate": 4.191843364951364e-06, "loss": 1.0939, "step": 9477 }, { "epoch": 0.29, "learning_rate": 4.191663776975003e-06, "loss": 1.1002, "step": 9478 }, { "epoch": 0.29, "learning_rate": 4.191484172894816e-06, "loss": 1.1748, "step": 9479 }, { "epoch": 0.29, "learning_rate": 4.191304552712515e-06, "loss": 1.1797, "step": 9480 }, { "epoch": 0.29, "learning_rate": 4.19112491642981e-06, "loss": 1.0906, "step": 9481 }, { "epoch": 0.29, "learning_rate": 4.190945264048409e-06, "loss": 1.2166, "step": 9482 }, { "epoch": 0.29, "learning_rate": 4.190765595570023e-06, "loss": 1.1394, "step": 9483 }, { "epoch": 0.29, "learning_rate": 4.190585910996364e-06, "loss": 1.1016, "step": 9484 }, { "epoch": 0.29, "learning_rate": 4.190406210329142e-06, "loss": 1.0838, "step": 9485 }, { "epoch": 0.29, "learning_rate": 4.1902264935700654e-06, "loss": 1.2679, "step": 9486 }, { "epoch": 0.29, "learning_rate": 4.190046760720847e-06, "loss": 1.2755, "step": 9487 }, { "epoch": 0.29, "learning_rate": 4.189867011783198e-06, "loss": 1.212, "step": 9488 }, { "epoch": 0.29, "learning_rate": 4.189687246758829e-06, "loss": 1.1346, "step": 9489 }, { "epoch": 0.29, "learning_rate": 4.18950746564945e-06, "loss": 1.1402, "step": 9490 }, { "epoch": 0.29, "learning_rate": 4.189327668456775e-06, "loss": 1.1199, "step": 9491 }, { "epoch": 0.29, "learning_rate": 4.1891478551825135e-06, "loss": 1.2639, "step": 9492 }, { "epoch": 0.29, "learning_rate": 4.188968025828379e-06, "loss": 1.2617, "step": 9493 }, { "epoch": 0.29, "learning_rate": 4.188788180396081e-06, "loss": 1.1759, "step": 9494 }, { "epoch": 0.29, "learning_rate": 4.188608318887333e-06, "loss": 1.1495, "step": 9495 }, { "epoch": 0.29, "learning_rate": 4.188428441303848e-06, "loss": 1.138, "step": 9496 }, { "epoch": 0.29, "learning_rate": 4.1882485476473365e-06, "loss": 1.1138, "step": 9497 }, { "epoch": 0.29, "learning_rate": 4.188068637919512e-06, "loss": 1.2137, "step": 9498 }, { "epoch": 0.29, "learning_rate": 4.187888712122088e-06, "loss": 1.2172, "step": 9499 }, { "epoch": 0.29, "learning_rate": 4.1877087702567755e-06, "loss": 1.1246, "step": 9500 }, { "epoch": 0.29, "learning_rate": 4.187528812325288e-06, "loss": 1.1843, "step": 9501 }, { "epoch": 0.29, "learning_rate": 4.187348838329339e-06, "loss": 1.1258, "step": 9502 }, { "epoch": 0.29, "learning_rate": 4.187168848270642e-06, "loss": 1.0752, "step": 9503 }, { "epoch": 0.29, "learning_rate": 4.186988842150911e-06, "loss": 1.198, "step": 9504 }, { "epoch": 0.29, "learning_rate": 4.186808819971858e-06, "loss": 1.2917, "step": 9505 }, { "epoch": 0.29, "learning_rate": 4.1866287817351975e-06, "loss": 1.105, "step": 9506 }, { "epoch": 0.29, "learning_rate": 4.186448727442643e-06, "loss": 1.0679, "step": 9507 }, { "epoch": 0.29, "learning_rate": 4.186268657095909e-06, "loss": 1.1721, "step": 9508 }, { "epoch": 0.29, "learning_rate": 4.1860885706967095e-06, "loss": 1.1388, "step": 9509 }, { "epoch": 0.29, "learning_rate": 4.185908468246759e-06, "loss": 1.0605, "step": 9510 }, { "epoch": 0.29, "learning_rate": 4.1857283497477715e-06, "loss": 1.0897, "step": 9511 }, { "epoch": 0.29, "learning_rate": 4.185548215201463e-06, "loss": 1.1776, "step": 9512 }, { "epoch": 0.29, "learning_rate": 4.185368064609546e-06, "loss": 1.1985, "step": 9513 }, { "epoch": 0.29, "learning_rate": 4.185187897973738e-06, "loss": 1.0872, "step": 9514 }, { "epoch": 0.29, "learning_rate": 4.185007715295752e-06, "loss": 1.0969, "step": 9515 }, { "epoch": 0.29, "learning_rate": 4.184827516577303e-06, "loss": 1.1403, "step": 9516 }, { "epoch": 0.29, "learning_rate": 4.184647301820109e-06, "loss": 1.1327, "step": 9517 }, { "epoch": 0.29, "learning_rate": 4.184467071025884e-06, "loss": 1.1823, "step": 9518 }, { "epoch": 0.29, "learning_rate": 4.1842868241963435e-06, "loss": 1.1401, "step": 9519 }, { "epoch": 0.29, "learning_rate": 4.184106561333203e-06, "loss": 1.1782, "step": 9520 }, { "epoch": 0.29, "learning_rate": 4.18392628243818e-06, "loss": 1.1351, "step": 9521 }, { "epoch": 0.29, "learning_rate": 4.18374598751299e-06, "loss": 1.0831, "step": 9522 }, { "epoch": 0.29, "learning_rate": 4.183565676559349e-06, "loss": 1.1055, "step": 9523 }, { "epoch": 0.29, "learning_rate": 4.183385349578972e-06, "loss": 1.149, "step": 9524 }, { "epoch": 0.29, "learning_rate": 4.183205006573579e-06, "loss": 1.1682, "step": 9525 }, { "epoch": 0.29, "learning_rate": 4.183024647544884e-06, "loss": 1.1064, "step": 9526 }, { "epoch": 0.29, "learning_rate": 4.182844272494606e-06, "loss": 1.1085, "step": 9527 }, { "epoch": 0.29, "learning_rate": 4.1826638814244604e-06, "loss": 1.1107, "step": 9528 }, { "epoch": 0.29, "learning_rate": 4.182483474336164e-06, "loss": 1.1259, "step": 9529 }, { "epoch": 0.29, "learning_rate": 4.182303051231436e-06, "loss": 1.1759, "step": 9530 }, { "epoch": 0.29, "learning_rate": 4.182122612111994e-06, "loss": 1.1368, "step": 9531 }, { "epoch": 0.29, "learning_rate": 4.181942156979555e-06, "loss": 1.1359, "step": 9532 }, { "epoch": 0.29, "learning_rate": 4.181761685835835e-06, "loss": 1.2273, "step": 9533 }, { "epoch": 0.29, "learning_rate": 4.181581198682556e-06, "loss": 1.1318, "step": 9534 }, { "epoch": 0.29, "learning_rate": 4.181400695521432e-06, "loss": 1.1262, "step": 9535 }, { "epoch": 0.29, "learning_rate": 4.181220176354184e-06, "loss": 1.1763, "step": 9536 }, { "epoch": 0.29, "learning_rate": 4.181039641182528e-06, "loss": 1.316, "step": 9537 }, { "epoch": 0.29, "learning_rate": 4.180859090008187e-06, "loss": 1.167, "step": 9538 }, { "epoch": 0.29, "learning_rate": 4.180678522832875e-06, "loss": 1.1822, "step": 9539 }, { "epoch": 0.29, "learning_rate": 4.180497939658314e-06, "loss": 1.1786, "step": 9540 }, { "epoch": 0.29, "learning_rate": 4.180317340486221e-06, "loss": 1.2173, "step": 9541 }, { "epoch": 0.29, "learning_rate": 4.180136725318317e-06, "loss": 1.1357, "step": 9542 }, { "epoch": 0.29, "learning_rate": 4.17995609415632e-06, "loss": 1.1013, "step": 9543 }, { "epoch": 0.29, "learning_rate": 4.1797754470019505e-06, "loss": 1.2029, "step": 9544 }, { "epoch": 0.29, "learning_rate": 4.179594783856927e-06, "loss": 1.1138, "step": 9545 }, { "epoch": 0.29, "learning_rate": 4.179414104722971e-06, "loss": 1.1283, "step": 9546 }, { "epoch": 0.29, "learning_rate": 4.179233409601802e-06, "loss": 1.0884, "step": 9547 }, { "epoch": 0.29, "learning_rate": 4.179052698495138e-06, "loss": 1.1743, "step": 9548 }, { "epoch": 0.29, "learning_rate": 4.178871971404702e-06, "loss": 1.363, "step": 9549 }, { "epoch": 0.29, "learning_rate": 4.178691228332213e-06, "loss": 1.1027, "step": 9550 }, { "epoch": 0.29, "learning_rate": 4.178510469279392e-06, "loss": 1.0914, "step": 9551 }, { "epoch": 0.29, "learning_rate": 4.17832969424796e-06, "loss": 1.1279, "step": 9552 }, { "epoch": 0.29, "learning_rate": 4.178148903239638e-06, "loss": 1.1829, "step": 9553 }, { "epoch": 0.29, "learning_rate": 4.177968096256146e-06, "loss": 1.2865, "step": 9554 }, { "epoch": 0.29, "learning_rate": 4.177787273299207e-06, "loss": 1.1765, "step": 9555 }, { "epoch": 0.29, "learning_rate": 4.1776064343705395e-06, "loss": 1.2158, "step": 9556 }, { "epoch": 0.29, "learning_rate": 4.177425579471867e-06, "loss": 1.1722, "step": 9557 }, { "epoch": 0.29, "learning_rate": 4.1772447086049115e-06, "loss": 1.193, "step": 9558 }, { "epoch": 0.29, "learning_rate": 4.177063821771395e-06, "loss": 1.172, "step": 9559 }, { "epoch": 0.29, "learning_rate": 4.176882918973037e-06, "loss": 1.1126, "step": 9560 }, { "epoch": 0.29, "learning_rate": 4.176702000211562e-06, "loss": 1.1846, "step": 9561 }, { "epoch": 0.29, "learning_rate": 4.176521065488691e-06, "loss": 1.1702, "step": 9562 }, { "epoch": 0.29, "learning_rate": 4.176340114806148e-06, "loss": 1.2922, "step": 9563 }, { "epoch": 0.29, "learning_rate": 4.176159148165654e-06, "loss": 1.1052, "step": 9564 }, { "epoch": 0.29, "learning_rate": 4.1759781655689315e-06, "loss": 1.1022, "step": 9565 }, { "epoch": 0.29, "learning_rate": 4.175797167017704e-06, "loss": 1.1513, "step": 9566 }, { "epoch": 0.29, "learning_rate": 4.1756161525136954e-06, "loss": 1.1721, "step": 9567 }, { "epoch": 0.29, "learning_rate": 4.175435122058627e-06, "loss": 1.1328, "step": 9568 }, { "epoch": 0.29, "learning_rate": 4.1752540756542246e-06, "loss": 1.152, "step": 9569 }, { "epoch": 0.29, "learning_rate": 4.175073013302209e-06, "loss": 1.1282, "step": 9570 }, { "epoch": 0.29, "learning_rate": 4.174891935004306e-06, "loss": 1.2135, "step": 9571 }, { "epoch": 0.29, "learning_rate": 4.174710840762237e-06, "loss": 1.1877, "step": 9572 }, { "epoch": 0.29, "learning_rate": 4.174529730577729e-06, "loss": 1.2438, "step": 9573 }, { "epoch": 0.29, "learning_rate": 4.174348604452504e-06, "loss": 1.1089, "step": 9574 }, { "epoch": 0.29, "learning_rate": 4.174167462388286e-06, "loss": 0.9628, "step": 9575 }, { "epoch": 0.29, "learning_rate": 4.173986304386801e-06, "loss": 1.2133, "step": 9576 }, { "epoch": 0.29, "learning_rate": 4.1738051304497715e-06, "loss": 1.0756, "step": 9577 }, { "epoch": 0.29, "learning_rate": 4.173623940578924e-06, "loss": 1.1319, "step": 9578 }, { "epoch": 0.29, "learning_rate": 4.173442734775983e-06, "loss": 1.16, "step": 9579 }, { "epoch": 0.29, "learning_rate": 4.173261513042673e-06, "loss": 1.0016, "step": 9580 }, { "epoch": 0.29, "learning_rate": 4.173080275380718e-06, "loss": 1.0426, "step": 9581 }, { "epoch": 0.29, "learning_rate": 4.172899021791845e-06, "loss": 1.1366, "step": 9582 }, { "epoch": 0.29, "learning_rate": 4.17271775227778e-06, "loss": 1.0723, "step": 9583 }, { "epoch": 0.29, "learning_rate": 4.172536466840247e-06, "loss": 1.1069, "step": 9584 }, { "epoch": 0.29, "learning_rate": 4.172355165480972e-06, "loss": 1.1569, "step": 9585 }, { "epoch": 0.29, "learning_rate": 4.172173848201682e-06, "loss": 1.1234, "step": 9586 }, { "epoch": 0.29, "learning_rate": 4.1719925150041014e-06, "loss": 1.2743, "step": 9587 }, { "epoch": 0.29, "learning_rate": 4.171811165889959e-06, "loss": 1.1417, "step": 9588 }, { "epoch": 0.29, "learning_rate": 4.171629800860978e-06, "loss": 1.136, "step": 9589 }, { "epoch": 0.29, "learning_rate": 4.171448419918887e-06, "loss": 1.114, "step": 9590 }, { "epoch": 0.29, "learning_rate": 4.171267023065412e-06, "loss": 1.0451, "step": 9591 }, { "epoch": 0.29, "learning_rate": 4.17108561030228e-06, "loss": 1.0865, "step": 9592 }, { "epoch": 0.29, "learning_rate": 4.1709041816312166e-06, "loss": 1.2806, "step": 9593 }, { "epoch": 0.29, "learning_rate": 4.170722737053951e-06, "loss": 1.1603, "step": 9594 }, { "epoch": 0.29, "learning_rate": 4.17054127657221e-06, "loss": 1.1169, "step": 9595 }, { "epoch": 0.29, "learning_rate": 4.17035980018772e-06, "loss": 1.1422, "step": 9596 }, { "epoch": 0.29, "learning_rate": 4.170178307902209e-06, "loss": 1.0699, "step": 9597 }, { "epoch": 0.29, "learning_rate": 4.169996799717405e-06, "loss": 1.0821, "step": 9598 }, { "epoch": 0.29, "learning_rate": 4.169815275635037e-06, "loss": 1.1057, "step": 9599 }, { "epoch": 0.29, "learning_rate": 4.169633735656831e-06, "loss": 1.2035, "step": 9600 }, { "epoch": 0.29, "learning_rate": 4.169452179784516e-06, "loss": 1.1392, "step": 9601 }, { "epoch": 0.29, "learning_rate": 4.169270608019819e-06, "loss": 1.08, "step": 9602 }, { "epoch": 0.29, "learning_rate": 4.1690890203644715e-06, "loss": 1.1685, "step": 9603 }, { "epoch": 0.29, "learning_rate": 4.1689074168202e-06, "loss": 1.2422, "step": 9604 }, { "epoch": 0.29, "learning_rate": 4.168725797388733e-06, "loss": 1.0953, "step": 9605 }, { "epoch": 0.29, "learning_rate": 4.1685441620718e-06, "loss": 1.3172, "step": 9606 }, { "epoch": 0.29, "learning_rate": 4.168362510871131e-06, "loss": 1.0676, "step": 9607 }, { "epoch": 0.29, "learning_rate": 4.168180843788454e-06, "loss": 1.2297, "step": 9608 }, { "epoch": 0.29, "learning_rate": 4.167999160825499e-06, "loss": 1.1009, "step": 9609 }, { "epoch": 0.29, "learning_rate": 4.1678174619839955e-06, "loss": 1.2348, "step": 9610 }, { "epoch": 0.29, "learning_rate": 4.167635747265672e-06, "loss": 1.1794, "step": 9611 }, { "epoch": 0.29, "learning_rate": 4.16745401667226e-06, "loss": 1.0886, "step": 9612 }, { "epoch": 0.29, "learning_rate": 4.167272270205489e-06, "loss": 1.1249, "step": 9613 }, { "epoch": 0.29, "learning_rate": 4.167090507867089e-06, "loss": 1.1749, "step": 9614 }, { "epoch": 0.29, "learning_rate": 4.16690872965879e-06, "loss": 1.1409, "step": 9615 }, { "epoch": 0.29, "learning_rate": 4.166726935582323e-06, "loss": 1.1743, "step": 9616 }, { "epoch": 0.29, "learning_rate": 4.1665451256394175e-06, "loss": 1.0893, "step": 9617 }, { "epoch": 0.29, "learning_rate": 4.166363299831806e-06, "loss": 1.0935, "step": 9618 }, { "epoch": 0.29, "learning_rate": 4.166181458161218e-06, "loss": 1.0496, "step": 9619 }, { "epoch": 0.29, "learning_rate": 4.165999600629385e-06, "loss": 1.1134, "step": 9620 }, { "epoch": 0.29, "learning_rate": 4.165817727238039e-06, "loss": 1.1317, "step": 9621 }, { "epoch": 0.29, "learning_rate": 4.165635837988909e-06, "loss": 1.0972, "step": 9622 }, { "epoch": 0.29, "learning_rate": 4.1654539328837285e-06, "loss": 1.2238, "step": 9623 }, { "epoch": 0.29, "learning_rate": 4.165272011924229e-06, "loss": 1.2177, "step": 9624 }, { "epoch": 0.29, "learning_rate": 4.165090075112142e-06, "loss": 1.1663, "step": 9625 }, { "epoch": 0.29, "learning_rate": 4.1649081224491995e-06, "loss": 1.2571, "step": 9626 }, { "epoch": 0.29, "learning_rate": 4.164726153937133e-06, "loss": 1.1713, "step": 9627 }, { "epoch": 0.29, "learning_rate": 4.164544169577676e-06, "loss": 1.2252, "step": 9628 }, { "epoch": 0.29, "learning_rate": 4.16436216937256e-06, "loss": 1.0745, "step": 9629 }, { "epoch": 0.29, "learning_rate": 4.164180153323517e-06, "loss": 1.079, "step": 9630 }, { "epoch": 0.29, "learning_rate": 4.163998121432281e-06, "loss": 1.0889, "step": 9631 }, { "epoch": 0.29, "learning_rate": 4.163816073700584e-06, "loss": 1.158, "step": 9632 }, { "epoch": 0.29, "learning_rate": 4.16363401013016e-06, "loss": 1.1964, "step": 9633 }, { "epoch": 0.29, "learning_rate": 4.163451930722741e-06, "loss": 1.2223, "step": 9634 }, { "epoch": 0.29, "learning_rate": 4.1632698354800605e-06, "loss": 1.3336, "step": 9635 }, { "epoch": 0.29, "learning_rate": 4.1630877244038525e-06, "loss": 1.2394, "step": 9636 }, { "epoch": 0.29, "learning_rate": 4.162905597495851e-06, "loss": 1.2026, "step": 9637 }, { "epoch": 0.29, "learning_rate": 4.1627234547577876e-06, "loss": 1.1453, "step": 9638 }, { "epoch": 0.29, "learning_rate": 4.162541296191398e-06, "loss": 1.0596, "step": 9639 }, { "epoch": 0.29, "learning_rate": 4.162359121798417e-06, "loss": 1.0998, "step": 9640 }, { "epoch": 0.29, "learning_rate": 4.1621769315805776e-06, "loss": 1.1863, "step": 9641 }, { "epoch": 0.29, "learning_rate": 4.1619947255396146e-06, "loss": 1.1848, "step": 9642 }, { "epoch": 0.29, "learning_rate": 4.161812503677261e-06, "loss": 1.1863, "step": 9643 }, { "epoch": 0.29, "learning_rate": 4.161630265995254e-06, "loss": 1.1361, "step": 9644 }, { "epoch": 0.29, "learning_rate": 4.161448012495326e-06, "loss": 1.1376, "step": 9645 }, { "epoch": 0.29, "learning_rate": 4.161265743179214e-06, "loss": 1.08, "step": 9646 }, { "epoch": 0.29, "learning_rate": 4.161083458048652e-06, "loss": 1.1837, "step": 9647 }, { "epoch": 0.29, "learning_rate": 4.160901157105374e-06, "loss": 1.1358, "step": 9648 }, { "epoch": 0.29, "learning_rate": 4.160718840351119e-06, "loss": 1.1329, "step": 9649 }, { "epoch": 0.29, "learning_rate": 4.16053650778762e-06, "loss": 1.2667, "step": 9650 }, { "epoch": 0.29, "learning_rate": 4.1603541594166134e-06, "loss": 1.2214, "step": 9651 }, { "epoch": 0.29, "learning_rate": 4.160171795239834e-06, "loss": 1.1671, "step": 9652 }, { "epoch": 0.29, "learning_rate": 4.1599894152590195e-06, "loss": 1.157, "step": 9653 }, { "epoch": 0.29, "learning_rate": 4.159807019475904e-06, "loss": 1.3354, "step": 9654 }, { "epoch": 0.29, "learning_rate": 4.159624607892226e-06, "loss": 1.1206, "step": 9655 }, { "epoch": 0.29, "learning_rate": 4.15944218050972e-06, "loss": 1.223, "step": 9656 }, { "epoch": 0.29, "learning_rate": 4.159259737330126e-06, "loss": 1.1197, "step": 9657 }, { "epoch": 0.29, "learning_rate": 4.159077278355177e-06, "loss": 1.1111, "step": 9658 }, { "epoch": 0.29, "learning_rate": 4.158894803586611e-06, "loss": 1.1804, "step": 9659 }, { "epoch": 0.29, "learning_rate": 4.1587123130261655e-06, "loss": 1.1395, "step": 9660 }, { "epoch": 0.29, "learning_rate": 4.158529806675577e-06, "loss": 1.1776, "step": 9661 }, { "epoch": 0.29, "learning_rate": 4.158347284536585e-06, "loss": 1.1694, "step": 9662 }, { "epoch": 0.29, "learning_rate": 4.158164746610925e-06, "loss": 1.1665, "step": 9663 }, { "epoch": 0.29, "learning_rate": 4.157982192900335e-06, "loss": 1.1953, "step": 9664 }, { "epoch": 0.29, "learning_rate": 4.157799623406553e-06, "loss": 1.0346, "step": 9665 }, { "epoch": 0.29, "learning_rate": 4.157617038131317e-06, "loss": 1.0632, "step": 9666 }, { "epoch": 0.29, "learning_rate": 4.157434437076366e-06, "loss": 1.2751, "step": 9667 }, { "epoch": 0.29, "learning_rate": 4.1572518202434366e-06, "loss": 1.079, "step": 9668 }, { "epoch": 0.29, "learning_rate": 4.157069187634268e-06, "loss": 1.0463, "step": 9669 }, { "epoch": 0.29, "learning_rate": 4.156886539250599e-06, "loss": 1.0957, "step": 9670 }, { "epoch": 0.29, "learning_rate": 4.156703875094168e-06, "loss": 1.2181, "step": 9671 }, { "epoch": 0.29, "learning_rate": 4.1565211951667146e-06, "loss": 1.1816, "step": 9672 }, { "epoch": 0.29, "learning_rate": 4.1563384994699766e-06, "loss": 1.1617, "step": 9673 }, { "epoch": 0.29, "learning_rate": 4.156155788005693e-06, "loss": 1.1229, "step": 9674 }, { "epoch": 0.29, "learning_rate": 4.155973060775606e-06, "loss": 1.2529, "step": 9675 }, { "epoch": 0.29, "learning_rate": 4.155790317781452e-06, "loss": 1.0475, "step": 9676 }, { "epoch": 0.29, "learning_rate": 4.155607559024971e-06, "loss": 1.0893, "step": 9677 }, { "epoch": 0.29, "learning_rate": 4.155424784507904e-06, "loss": 1.1538, "step": 9678 }, { "epoch": 0.29, "learning_rate": 4.15524199423199e-06, "loss": 1.1436, "step": 9679 }, { "epoch": 0.29, "learning_rate": 4.15505918819897e-06, "loss": 1.2129, "step": 9680 }, { "epoch": 0.29, "learning_rate": 4.154876366410583e-06, "loss": 1.1234, "step": 9681 }, { "epoch": 0.29, "learning_rate": 4.154693528868571e-06, "loss": 1.2509, "step": 9682 }, { "epoch": 0.29, "learning_rate": 4.1545106755746725e-06, "loss": 1.0709, "step": 9683 }, { "epoch": 0.29, "learning_rate": 4.154327806530629e-06, "loss": 1.1382, "step": 9684 }, { "epoch": 0.29, "learning_rate": 4.154144921738182e-06, "loss": 1.1365, "step": 9685 }, { "epoch": 0.29, "learning_rate": 4.153962021199073e-06, "loss": 1.1061, "step": 9686 }, { "epoch": 0.29, "learning_rate": 4.153779104915041e-06, "loss": 1.2584, "step": 9687 }, { "epoch": 0.29, "learning_rate": 4.153596172887828e-06, "loss": 1.1842, "step": 9688 }, { "epoch": 0.29, "learning_rate": 4.153413225119177e-06, "loss": 1.1666, "step": 9689 }, { "epoch": 0.29, "learning_rate": 4.1532302616108275e-06, "loss": 1.154, "step": 9690 }, { "epoch": 0.29, "learning_rate": 4.153047282364522e-06, "loss": 1.1003, "step": 9691 }, { "epoch": 0.29, "learning_rate": 4.152864287382004e-06, "loss": 1.1698, "step": 9692 }, { "epoch": 0.29, "learning_rate": 4.152681276665013e-06, "loss": 0.9037, "step": 9693 }, { "epoch": 0.29, "learning_rate": 4.152498250215292e-06, "loss": 1.192, "step": 9694 }, { "epoch": 0.29, "learning_rate": 4.152315208034584e-06, "loss": 1.2195, "step": 9695 }, { "epoch": 0.29, "learning_rate": 4.15213215012463e-06, "loss": 1.0961, "step": 9696 }, { "epoch": 0.29, "learning_rate": 4.151949076487175e-06, "loss": 1.1879, "step": 9697 }, { "epoch": 0.29, "learning_rate": 4.151765987123959e-06, "loss": 1.1563, "step": 9698 }, { "epoch": 0.29, "learning_rate": 4.151582882036728e-06, "loss": 1.1219, "step": 9699 }, { "epoch": 0.29, "learning_rate": 4.1513997612272226e-06, "loss": 1.1359, "step": 9700 }, { "epoch": 0.29, "learning_rate": 4.151216624697186e-06, "loss": 1.1409, "step": 9701 }, { "epoch": 0.29, "learning_rate": 4.151033472448363e-06, "loss": 1.0704, "step": 9702 }, { "epoch": 0.29, "learning_rate": 4.150850304482497e-06, "loss": 1.0979, "step": 9703 }, { "epoch": 0.29, "learning_rate": 4.1506671208013305e-06, "loss": 1.1672, "step": 9704 }, { "epoch": 0.29, "learning_rate": 4.150483921406609e-06, "loss": 1.2411, "step": 9705 }, { "epoch": 0.29, "learning_rate": 4.150300706300075e-06, "loss": 1.0709, "step": 9706 }, { "epoch": 0.29, "learning_rate": 4.150117475483472e-06, "loss": 1.0923, "step": 9707 }, { "epoch": 0.29, "learning_rate": 4.1499342289585465e-06, "loss": 1.139, "step": 9708 }, { "epoch": 0.29, "learning_rate": 4.149750966727041e-06, "loss": 0.9995, "step": 9709 }, { "epoch": 0.29, "learning_rate": 4.149567688790702e-06, "loss": 1.1995, "step": 9710 }, { "epoch": 0.29, "learning_rate": 4.149384395151272e-06, "loss": 1.0845, "step": 9711 }, { "epoch": 0.29, "learning_rate": 4.149201085810497e-06, "loss": 1.1806, "step": 9712 }, { "epoch": 0.29, "learning_rate": 4.149017760770123e-06, "loss": 1.2311, "step": 9713 }, { "epoch": 0.29, "learning_rate": 4.148834420031893e-06, "loss": 1.026, "step": 9714 }, { "epoch": 0.29, "learning_rate": 4.148651063597553e-06, "loss": 1.1995, "step": 9715 }, { "epoch": 0.29, "learning_rate": 4.1484676914688505e-06, "loss": 1.1344, "step": 9716 }, { "epoch": 0.29, "learning_rate": 4.148284303647529e-06, "loss": 1.1312, "step": 9717 }, { "epoch": 0.29, "learning_rate": 4.148100900135334e-06, "loss": 1.0802, "step": 9718 }, { "epoch": 0.29, "learning_rate": 4.147917480934013e-06, "loss": 1.1541, "step": 9719 }, { "epoch": 0.29, "learning_rate": 4.1477340460453105e-06, "loss": 1.1227, "step": 9720 }, { "epoch": 0.29, "learning_rate": 4.1475505954709735e-06, "loss": 1.0814, "step": 9721 }, { "epoch": 0.29, "learning_rate": 4.147367129212749e-06, "loss": 1.1588, "step": 9722 }, { "epoch": 0.29, "learning_rate": 4.1471836472723824e-06, "loss": 1.1249, "step": 9723 }, { "epoch": 0.29, "learning_rate": 4.147000149651621e-06, "loss": 1.1204, "step": 9724 }, { "epoch": 0.29, "learning_rate": 4.146816636352211e-06, "loss": 1.1452, "step": 9725 }, { "epoch": 0.29, "learning_rate": 4.146633107375901e-06, "loss": 1.0214, "step": 9726 }, { "epoch": 0.29, "learning_rate": 4.146449562724435e-06, "loss": 1.0713, "step": 9727 }, { "epoch": 0.29, "learning_rate": 4.146266002399563e-06, "loss": 1.1755, "step": 9728 }, { "epoch": 0.29, "learning_rate": 4.146082426403032e-06, "loss": 1.1697, "step": 9729 }, { "epoch": 0.29, "learning_rate": 4.145898834736588e-06, "loss": 1.231, "step": 9730 }, { "epoch": 0.29, "learning_rate": 4.145715227401981e-06, "loss": 1.2272, "step": 9731 }, { "epoch": 0.29, "learning_rate": 4.145531604400956e-06, "loss": 1.052, "step": 9732 }, { "epoch": 0.29, "learning_rate": 4.145347965735265e-06, "loss": 1.1611, "step": 9733 }, { "epoch": 0.29, "learning_rate": 4.145164311406652e-06, "loss": 1.1027, "step": 9734 }, { "epoch": 0.29, "learning_rate": 4.144980641416868e-06, "loss": 1.1946, "step": 9735 }, { "epoch": 0.29, "learning_rate": 4.144796955767659e-06, "loss": 1.1225, "step": 9736 }, { "epoch": 0.29, "learning_rate": 4.144613254460777e-06, "loss": 1.1417, "step": 9737 }, { "epoch": 0.29, "learning_rate": 4.1444295374979685e-06, "loss": 1.1085, "step": 9738 }, { "epoch": 0.29, "learning_rate": 4.144245804880982e-06, "loss": 1.1996, "step": 9739 }, { "epoch": 0.29, "learning_rate": 4.144062056611568e-06, "loss": 1.0983, "step": 9740 }, { "epoch": 0.29, "learning_rate": 4.143878292691474e-06, "loss": 1.1187, "step": 9741 }, { "epoch": 0.29, "learning_rate": 4.143694513122452e-06, "loss": 1.1061, "step": 9742 }, { "epoch": 0.29, "learning_rate": 4.143510717906248e-06, "loss": 1.2452, "step": 9743 }, { "epoch": 0.29, "learning_rate": 4.143326907044616e-06, "loss": 1.1524, "step": 9744 }, { "epoch": 0.29, "learning_rate": 4.143143080539301e-06, "loss": 1.103, "step": 9745 }, { "epoch": 0.29, "learning_rate": 4.1429592383920565e-06, "loss": 1.0723, "step": 9746 }, { "epoch": 0.29, "learning_rate": 4.142775380604631e-06, "loss": 0.9992, "step": 9747 }, { "epoch": 0.29, "learning_rate": 4.1425915071787745e-06, "loss": 1.1544, "step": 9748 }, { "epoch": 0.29, "learning_rate": 4.142407618116239e-06, "loss": 1.1565, "step": 9749 }, { "epoch": 0.29, "learning_rate": 4.142223713418773e-06, "loss": 1.2004, "step": 9750 }, { "epoch": 0.29, "learning_rate": 4.142039793088129e-06, "loss": 1.1879, "step": 9751 }, { "epoch": 0.29, "learning_rate": 4.141855857126057e-06, "loss": 1.1091, "step": 9752 }, { "epoch": 0.29, "learning_rate": 4.141671905534307e-06, "loss": 1.0287, "step": 9753 }, { "epoch": 0.29, "learning_rate": 4.141487938314631e-06, "loss": 1.2289, "step": 9754 }, { "epoch": 0.29, "learning_rate": 4.141303955468782e-06, "loss": 1.1629, "step": 9755 }, { "epoch": 0.29, "learning_rate": 4.141119956998509e-06, "loss": 1.2401, "step": 9756 }, { "epoch": 0.29, "learning_rate": 4.140935942905564e-06, "loss": 1.2805, "step": 9757 }, { "epoch": 0.29, "learning_rate": 4.140751913191699e-06, "loss": 1.1412, "step": 9758 }, { "epoch": 0.29, "learning_rate": 4.140567867858667e-06, "loss": 1.1589, "step": 9759 }, { "epoch": 0.29, "learning_rate": 4.140383806908218e-06, "loss": 1.0331, "step": 9760 }, { "epoch": 0.29, "learning_rate": 4.140199730342106e-06, "loss": 1.2545, "step": 9761 }, { "epoch": 0.29, "learning_rate": 4.140015638162082e-06, "loss": 1.2242, "step": 9762 }, { "epoch": 0.29, "learning_rate": 4.139831530369899e-06, "loss": 1.1175, "step": 9763 }, { "epoch": 0.29, "learning_rate": 4.1396474069673095e-06, "loss": 1.1933, "step": 9764 }, { "epoch": 0.29, "learning_rate": 4.139463267956067e-06, "loss": 1.1622, "step": 9765 }, { "epoch": 0.29, "learning_rate": 4.139279113337923e-06, "loss": 1.0541, "step": 9766 }, { "epoch": 0.29, "learning_rate": 4.139094943114632e-06, "loss": 1.0701, "step": 9767 }, { "epoch": 0.29, "learning_rate": 4.138910757287946e-06, "loss": 1.1436, "step": 9768 }, { "epoch": 0.29, "learning_rate": 4.13872655585962e-06, "loss": 1.2374, "step": 9769 }, { "epoch": 0.29, "learning_rate": 4.138542338831405e-06, "loss": 1.2314, "step": 9770 }, { "epoch": 0.29, "learning_rate": 4.138358106205057e-06, "loss": 0.9623, "step": 9771 }, { "epoch": 0.29, "learning_rate": 4.138173857982329e-06, "loss": 1.1353, "step": 9772 }, { "epoch": 0.29, "learning_rate": 4.137989594164974e-06, "loss": 1.1803, "step": 9773 }, { "epoch": 0.29, "learning_rate": 4.137805314754747e-06, "loss": 1.1564, "step": 9774 }, { "epoch": 0.29, "learning_rate": 4.137621019753403e-06, "loss": 1.144, "step": 9775 }, { "epoch": 0.29, "learning_rate": 4.137436709162695e-06, "loss": 1.1915, "step": 9776 }, { "epoch": 0.29, "learning_rate": 4.137252382984378e-06, "loss": 1.1621, "step": 9777 }, { "epoch": 0.29, "learning_rate": 4.137068041220208e-06, "loss": 1.1743, "step": 9778 }, { "epoch": 0.29, "learning_rate": 4.136883683871937e-06, "loss": 1.112, "step": 9779 }, { "epoch": 0.29, "learning_rate": 4.136699310941324e-06, "loss": 1.0723, "step": 9780 }, { "epoch": 0.29, "learning_rate": 4.136514922430119e-06, "loss": 1.1245, "step": 9781 }, { "epoch": 0.29, "learning_rate": 4.136330518340082e-06, "loss": 1.183, "step": 9782 }, { "epoch": 0.29, "learning_rate": 4.136146098672966e-06, "loss": 1.0154, "step": 9783 }, { "epoch": 0.29, "learning_rate": 4.135961663430527e-06, "loss": 1.1312, "step": 9784 }, { "epoch": 0.29, "learning_rate": 4.135777212614521e-06, "loss": 1.1436, "step": 9785 }, { "epoch": 0.29, "learning_rate": 4.1355927462267046e-06, "loss": 1.0731, "step": 9786 }, { "epoch": 0.29, "learning_rate": 4.135408264268832e-06, "loss": 1.2017, "step": 9787 }, { "epoch": 0.29, "learning_rate": 4.13522376674266e-06, "loss": 1.0895, "step": 9788 }, { "epoch": 0.29, "learning_rate": 4.135039253649946e-06, "loss": 1.1625, "step": 9789 }, { "epoch": 0.29, "learning_rate": 4.134854724992445e-06, "loss": 1.1297, "step": 9790 }, { "epoch": 0.29, "learning_rate": 4.134670180771916e-06, "loss": 1.1292, "step": 9791 }, { "epoch": 0.29, "learning_rate": 4.134485620990113e-06, "loss": 1.1373, "step": 9792 }, { "epoch": 0.3, "learning_rate": 4.134301045648794e-06, "loss": 1.272, "step": 9793 }, { "epoch": 0.3, "learning_rate": 4.134116454749716e-06, "loss": 1.0109, "step": 9794 }, { "epoch": 0.3, "learning_rate": 4.133931848294637e-06, "loss": 1.1709, "step": 9795 }, { "epoch": 0.3, "learning_rate": 4.133747226285314e-06, "loss": 1.1177, "step": 9796 }, { "epoch": 0.3, "learning_rate": 4.133562588723503e-06, "loss": 1.1746, "step": 9797 }, { "epoch": 0.3, "learning_rate": 4.133377935610963e-06, "loss": 1.2121, "step": 9798 }, { "epoch": 0.3, "learning_rate": 4.133193266949453e-06, "loss": 1.1845, "step": 9799 }, { "epoch": 0.3, "learning_rate": 4.1330085827407295e-06, "loss": 1.0733, "step": 9800 }, { "epoch": 0.3, "learning_rate": 4.13282388298655e-06, "loss": 1.1776, "step": 9801 }, { "epoch": 0.3, "learning_rate": 4.132639167688674e-06, "loss": 1.0918, "step": 9802 }, { "epoch": 0.3, "learning_rate": 4.132454436848859e-06, "loss": 1.1086, "step": 9803 }, { "epoch": 0.3, "learning_rate": 4.132269690468865e-06, "loss": 1.1901, "step": 9804 }, { "epoch": 0.3, "learning_rate": 4.132084928550448e-06, "loss": 1.1762, "step": 9805 }, { "epoch": 0.3, "learning_rate": 4.1319001510953696e-06, "loss": 1.1398, "step": 9806 }, { "epoch": 0.3, "learning_rate": 4.1317153581053885e-06, "loss": 1.229, "step": 9807 }, { "epoch": 0.3, "learning_rate": 4.131530549582261e-06, "loss": 1.1296, "step": 9808 }, { "epoch": 0.3, "learning_rate": 4.13134572552775e-06, "loss": 1.0405, "step": 9809 }, { "epoch": 0.3, "learning_rate": 4.131160885943612e-06, "loss": 1.0872, "step": 9810 }, { "epoch": 0.3, "learning_rate": 4.13097603083161e-06, "loss": 1.1234, "step": 9811 }, { "epoch": 0.3, "learning_rate": 4.1307911601935e-06, "loss": 1.1848, "step": 9812 }, { "epoch": 0.3, "learning_rate": 4.130606274031045e-06, "loss": 1.2623, "step": 9813 }, { "epoch": 0.3, "learning_rate": 4.130421372346001e-06, "loss": 1.1791, "step": 9814 }, { "epoch": 0.3, "learning_rate": 4.130236455140134e-06, "loss": 1.0479, "step": 9815 }, { "epoch": 0.3, "learning_rate": 4.130051522415199e-06, "loss": 0.9941, "step": 9816 }, { "epoch": 0.3, "learning_rate": 4.129866574172959e-06, "loss": 1.1747, "step": 9817 }, { "epoch": 0.3, "learning_rate": 4.1296816104151745e-06, "loss": 1.1959, "step": 9818 }, { "epoch": 0.3, "learning_rate": 4.129496631143606e-06, "loss": 1.0965, "step": 9819 }, { "epoch": 0.3, "learning_rate": 4.129311636360014e-06, "loss": 1.1382, "step": 9820 }, { "epoch": 0.3, "learning_rate": 4.12912662606616e-06, "loss": 1.0879, "step": 9821 }, { "epoch": 0.3, "learning_rate": 4.1289416002638056e-06, "loss": 1.1624, "step": 9822 }, { "epoch": 0.3, "learning_rate": 4.1287565589547115e-06, "loss": 1.194, "step": 9823 }, { "epoch": 0.3, "learning_rate": 4.1285715021406396e-06, "loss": 1.1599, "step": 9824 }, { "epoch": 0.3, "learning_rate": 4.12838642982335e-06, "loss": 1.1587, "step": 9825 }, { "epoch": 0.3, "learning_rate": 4.1282013420046076e-06, "loss": 1.0378, "step": 9826 }, { "epoch": 0.3, "learning_rate": 4.128016238686171e-06, "loss": 1.1061, "step": 9827 }, { "epoch": 0.3, "learning_rate": 4.127831119869805e-06, "loss": 1.1478, "step": 9828 }, { "epoch": 0.3, "learning_rate": 4.12764598555727e-06, "loss": 1.0007, "step": 9829 }, { "epoch": 0.3, "learning_rate": 4.12746083575033e-06, "loss": 1.2175, "step": 9830 }, { "epoch": 0.3, "learning_rate": 4.127275670450746e-06, "loss": 1.2434, "step": 9831 }, { "epoch": 0.3, "learning_rate": 4.127090489660281e-06, "loss": 1.1686, "step": 9832 }, { "epoch": 0.3, "learning_rate": 4.1269052933807e-06, "loss": 1.0873, "step": 9833 }, { "epoch": 0.3, "learning_rate": 4.126720081613762e-06, "loss": 1.1706, "step": 9834 }, { "epoch": 0.3, "learning_rate": 4.126534854361234e-06, "loss": 1.1287, "step": 9835 }, { "epoch": 0.3, "learning_rate": 4.126349611624876e-06, "loss": 1.211, "step": 9836 }, { "epoch": 0.3, "learning_rate": 4.126164353406454e-06, "loss": 1.1652, "step": 9837 }, { "epoch": 0.3, "learning_rate": 4.12597907970773e-06, "loss": 1.0503, "step": 9838 }, { "epoch": 0.3, "learning_rate": 4.125793790530469e-06, "loss": 1.1912, "step": 9839 }, { "epoch": 0.3, "learning_rate": 4.125608485876433e-06, "loss": 1.0571, "step": 9840 }, { "epoch": 0.3, "learning_rate": 4.1254231657473876e-06, "loss": 1.1249, "step": 9841 }, { "epoch": 0.3, "learning_rate": 4.125237830145097e-06, "loss": 1.1879, "step": 9842 }, { "epoch": 0.3, "learning_rate": 4.125052479071324e-06, "loss": 1.1505, "step": 9843 }, { "epoch": 0.3, "learning_rate": 4.124867112527835e-06, "loss": 1.2619, "step": 9844 }, { "epoch": 0.3, "learning_rate": 4.124681730516394e-06, "loss": 1.1738, "step": 9845 }, { "epoch": 0.3, "learning_rate": 4.124496333038764e-06, "loss": 1.0844, "step": 9846 }, { "epoch": 0.3, "learning_rate": 4.124310920096712e-06, "loss": 1.1323, "step": 9847 }, { "epoch": 0.3, "learning_rate": 4.1241254916920025e-06, "loss": 1.0178, "step": 9848 }, { "epoch": 0.3, "learning_rate": 4.123940047826401e-06, "loss": 1.2441, "step": 9849 }, { "epoch": 0.3, "learning_rate": 4.123754588501671e-06, "loss": 1.1227, "step": 9850 }, { "epoch": 0.3, "learning_rate": 4.12356911371958e-06, "loss": 1.1286, "step": 9851 }, { "epoch": 0.3, "learning_rate": 4.123383623481893e-06, "loss": 1.1221, "step": 9852 }, { "epoch": 0.3, "learning_rate": 4.123198117790375e-06, "loss": 1.1612, "step": 9853 }, { "epoch": 0.3, "learning_rate": 4.123012596646795e-06, "loss": 1.1901, "step": 9854 }, { "epoch": 0.3, "learning_rate": 4.122827060052914e-06, "loss": 1.1395, "step": 9855 }, { "epoch": 0.3, "learning_rate": 4.122641508010503e-06, "loss": 1.2546, "step": 9856 }, { "epoch": 0.3, "learning_rate": 4.122455940521326e-06, "loss": 1.0449, "step": 9857 }, { "epoch": 0.3, "learning_rate": 4.122270357587148e-06, "loss": 1.2397, "step": 9858 }, { "epoch": 0.3, "learning_rate": 4.12208475920974e-06, "loss": 1.2028, "step": 9859 }, { "epoch": 0.3, "learning_rate": 4.121899145390864e-06, "loss": 1.1909, "step": 9860 }, { "epoch": 0.3, "learning_rate": 4.1217135161322915e-06, "loss": 1.1641, "step": 9861 }, { "epoch": 0.3, "learning_rate": 4.121527871435786e-06, "loss": 1.2375, "step": 9862 }, { "epoch": 0.3, "learning_rate": 4.121342211303116e-06, "loss": 1.0848, "step": 9863 }, { "epoch": 0.3, "learning_rate": 4.12115653573605e-06, "loss": 1.1084, "step": 9864 }, { "epoch": 0.3, "learning_rate": 4.120970844736354e-06, "loss": 1.1794, "step": 9865 }, { "epoch": 0.3, "learning_rate": 4.120785138305796e-06, "loss": 1.15, "step": 9866 }, { "epoch": 0.3, "learning_rate": 4.1205994164461445e-06, "loss": 1.1822, "step": 9867 }, { "epoch": 0.3, "learning_rate": 4.120413679159167e-06, "loss": 1.0887, "step": 9868 }, { "epoch": 0.3, "learning_rate": 4.120227926446632e-06, "loss": 1.1868, "step": 9869 }, { "epoch": 0.3, "learning_rate": 4.1200421583103065e-06, "loss": 1.0864, "step": 9870 }, { "epoch": 0.3, "learning_rate": 4.119856374751961e-06, "loss": 1.229, "step": 9871 }, { "epoch": 0.3, "learning_rate": 4.1196705757733625e-06, "loss": 1.2103, "step": 9872 }, { "epoch": 0.3, "learning_rate": 4.119484761376279e-06, "loss": 1.1919, "step": 9873 }, { "epoch": 0.3, "learning_rate": 4.119298931562482e-06, "loss": 1.0676, "step": 9874 }, { "epoch": 0.3, "learning_rate": 4.119113086333739e-06, "loss": 1.1521, "step": 9875 }, { "epoch": 0.3, "learning_rate": 4.118927225691819e-06, "loss": 1.1499, "step": 9876 }, { "epoch": 0.3, "learning_rate": 4.118741349638492e-06, "loss": 1.1293, "step": 9877 }, { "epoch": 0.3, "learning_rate": 4.118555458175526e-06, "loss": 1.0995, "step": 9878 }, { "epoch": 0.3, "learning_rate": 4.118369551304692e-06, "loss": 0.9854, "step": 9879 }, { "epoch": 0.3, "learning_rate": 4.1181836290277586e-06, "loss": 1.1115, "step": 9880 }, { "epoch": 0.3, "learning_rate": 4.117997691346498e-06, "loss": 1.2133, "step": 9881 }, { "epoch": 0.3, "learning_rate": 4.117811738262677e-06, "loss": 1.1517, "step": 9882 }, { "epoch": 0.3, "learning_rate": 4.117625769778068e-06, "loss": 1.1006, "step": 9883 }, { "epoch": 0.3, "learning_rate": 4.117439785894442e-06, "loss": 1.2326, "step": 9884 }, { "epoch": 0.3, "learning_rate": 4.117253786613566e-06, "loss": 1.1127, "step": 9885 }, { "epoch": 0.3, "learning_rate": 4.117067771937214e-06, "loss": 1.0957, "step": 9886 }, { "epoch": 0.3, "learning_rate": 4.116881741867156e-06, "loss": 1.278, "step": 9887 }, { "epoch": 0.3, "learning_rate": 4.116695696405162e-06, "loss": 1.152, "step": 9888 }, { "epoch": 0.3, "learning_rate": 4.116509635553003e-06, "loss": 1.1487, "step": 9889 }, { "epoch": 0.3, "learning_rate": 4.116323559312452e-06, "loss": 1.1134, "step": 9890 }, { "epoch": 0.3, "learning_rate": 4.116137467685278e-06, "loss": 1.1039, "step": 9891 }, { "epoch": 0.3, "learning_rate": 4.115951360673255e-06, "loss": 1.228, "step": 9892 }, { "epoch": 0.3, "learning_rate": 4.115765238278153e-06, "loss": 1.244, "step": 9893 }, { "epoch": 0.3, "learning_rate": 4.115579100501743e-06, "loss": 1.2045, "step": 9894 }, { "epoch": 0.3, "learning_rate": 4.115392947345799e-06, "loss": 1.1718, "step": 9895 }, { "epoch": 0.3, "learning_rate": 4.115206778812092e-06, "loss": 0.9818, "step": 9896 }, { "epoch": 0.3, "learning_rate": 4.1150205949023945e-06, "loss": 1.1551, "step": 9897 }, { "epoch": 0.3, "learning_rate": 4.114834395618478e-06, "loss": 1.1331, "step": 9898 }, { "epoch": 0.3, "learning_rate": 4.114648180962116e-06, "loss": 1.0781, "step": 9899 }, { "epoch": 0.3, "learning_rate": 4.114461950935082e-06, "loss": 1.0768, "step": 9900 }, { "epoch": 0.3, "learning_rate": 4.114275705539147e-06, "loss": 1.2082, "step": 9901 }, { "epoch": 0.3, "learning_rate": 4.114089444776085e-06, "loss": 1.1804, "step": 9902 }, { "epoch": 0.3, "learning_rate": 4.113903168647669e-06, "loss": 1.1207, "step": 9903 }, { "epoch": 0.3, "learning_rate": 4.113716877155671e-06, "loss": 1.1506, "step": 9904 }, { "epoch": 0.3, "learning_rate": 4.113530570301867e-06, "loss": 1.1027, "step": 9905 }, { "epoch": 0.3, "learning_rate": 4.113344248088028e-06, "loss": 1.1887, "step": 9906 }, { "epoch": 0.3, "learning_rate": 4.113157910515929e-06, "loss": 1.1719, "step": 9907 }, { "epoch": 0.3, "learning_rate": 4.112971557587344e-06, "loss": 1.1108, "step": 9908 }, { "epoch": 0.3, "learning_rate": 4.112785189304046e-06, "loss": 1.0629, "step": 9909 }, { "epoch": 0.3, "learning_rate": 4.112598805667811e-06, "loss": 1.2697, "step": 9910 }, { "epoch": 0.3, "learning_rate": 4.112412406680411e-06, "loss": 1.3131, "step": 9911 }, { "epoch": 0.3, "learning_rate": 4.112225992343621e-06, "loss": 1.1946, "step": 9912 }, { "epoch": 0.3, "learning_rate": 4.112039562659217e-06, "loss": 1.0739, "step": 9913 }, { "epoch": 0.3, "learning_rate": 4.111853117628972e-06, "loss": 1.1919, "step": 9914 }, { "epoch": 0.3, "learning_rate": 4.111666657254663e-06, "loss": 1.1151, "step": 9915 }, { "epoch": 0.3, "learning_rate": 4.111480181538062e-06, "loss": 1.1309, "step": 9916 }, { "epoch": 0.3, "learning_rate": 4.111293690480947e-06, "loss": 1.1885, "step": 9917 }, { "epoch": 0.3, "learning_rate": 4.1111071840850905e-06, "loss": 1.2582, "step": 9918 }, { "epoch": 0.3, "learning_rate": 4.110920662352271e-06, "loss": 1.2014, "step": 9919 }, { "epoch": 0.3, "learning_rate": 4.110734125284262e-06, "loss": 1.2196, "step": 9920 }, { "epoch": 0.3, "learning_rate": 4.1105475728828405e-06, "loss": 1.1223, "step": 9921 }, { "epoch": 0.3, "learning_rate": 4.110361005149781e-06, "loss": 1.161, "step": 9922 }, { "epoch": 0.3, "learning_rate": 4.110174422086861e-06, "loss": 1.2574, "step": 9923 }, { "epoch": 0.3, "learning_rate": 4.109987823695855e-06, "loss": 1.2155, "step": 9924 }, { "epoch": 0.3, "learning_rate": 4.109801209978541e-06, "loss": 1.1965, "step": 9925 }, { "epoch": 0.3, "learning_rate": 4.109614580936695e-06, "loss": 1.1501, "step": 9926 }, { "epoch": 0.3, "learning_rate": 4.1094279365720925e-06, "loss": 1.1118, "step": 9927 }, { "epoch": 0.3, "learning_rate": 4.109241276886513e-06, "loss": 1.058, "step": 9928 }, { "epoch": 0.3, "learning_rate": 4.10905460188173e-06, "loss": 1.2595, "step": 9929 }, { "epoch": 0.3, "learning_rate": 4.108867911559523e-06, "loss": 1.1948, "step": 9930 }, { "epoch": 0.3, "learning_rate": 4.108681205921667e-06, "loss": 1.2026, "step": 9931 }, { "epoch": 0.3, "learning_rate": 4.108494484969942e-06, "loss": 1.0459, "step": 9932 }, { "epoch": 0.3, "learning_rate": 4.108307748706124e-06, "loss": 1.0341, "step": 9933 }, { "epoch": 0.3, "learning_rate": 4.10812099713199e-06, "loss": 1.0862, "step": 9934 }, { "epoch": 0.3, "learning_rate": 4.10793423024932e-06, "loss": 1.0978, "step": 9935 }, { "epoch": 0.3, "learning_rate": 4.107747448059889e-06, "loss": 1.2947, "step": 9936 }, { "epoch": 0.3, "learning_rate": 4.107560650565477e-06, "loss": 1.2062, "step": 9937 }, { "epoch": 0.3, "learning_rate": 4.107373837767863e-06, "loss": 1.0739, "step": 9938 }, { "epoch": 0.3, "learning_rate": 4.107187009668823e-06, "loss": 1.1517, "step": 9939 }, { "epoch": 0.3, "learning_rate": 4.107000166270137e-06, "loss": 1.1888, "step": 9940 }, { "epoch": 0.3, "learning_rate": 4.106813307573584e-06, "loss": 1.1345, "step": 9941 }, { "epoch": 0.3, "learning_rate": 4.106626433580941e-06, "loss": 1.0248, "step": 9942 }, { "epoch": 0.3, "learning_rate": 4.106439544293989e-06, "loss": 1.2134, "step": 9943 }, { "epoch": 0.3, "learning_rate": 4.106252639714506e-06, "loss": 1.1412, "step": 9944 }, { "epoch": 0.3, "learning_rate": 4.106065719844272e-06, "loss": 1.1289, "step": 9945 }, { "epoch": 0.3, "learning_rate": 4.105878784685064e-06, "loss": 1.152, "step": 9946 }, { "epoch": 0.3, "learning_rate": 4.105691834238665e-06, "loss": 1.1224, "step": 9947 }, { "epoch": 0.3, "learning_rate": 4.105504868506853e-06, "loss": 1.1908, "step": 9948 }, { "epoch": 0.3, "learning_rate": 4.1053178874914075e-06, "loss": 1.0343, "step": 9949 }, { "epoch": 0.3, "learning_rate": 4.105130891194109e-06, "loss": 1.0865, "step": 9950 }, { "epoch": 0.3, "learning_rate": 4.104943879616738e-06, "loss": 1.1331, "step": 9951 }, { "epoch": 0.3, "learning_rate": 4.104756852761073e-06, "loss": 1.1252, "step": 9952 }, { "epoch": 0.3, "learning_rate": 4.1045698106288966e-06, "loss": 1.1588, "step": 9953 }, { "epoch": 0.3, "learning_rate": 4.104382753221988e-06, "loss": 1.0928, "step": 9954 }, { "epoch": 0.3, "learning_rate": 4.104195680542129e-06, "loss": 1.144, "step": 9955 }, { "epoch": 0.3, "learning_rate": 4.104008592591099e-06, "loss": 1.2859, "step": 9956 }, { "epoch": 0.3, "learning_rate": 4.103821489370679e-06, "loss": 1.2067, "step": 9957 }, { "epoch": 0.3, "learning_rate": 4.103634370882653e-06, "loss": 1.1135, "step": 9958 }, { "epoch": 0.3, "learning_rate": 4.103447237128798e-06, "loss": 1.0145, "step": 9959 }, { "epoch": 0.3, "learning_rate": 4.103260088110899e-06, "loss": 1.132, "step": 9960 }, { "epoch": 0.3, "learning_rate": 4.103072923830735e-06, "loss": 1.0706, "step": 9961 }, { "epoch": 0.3, "learning_rate": 4.10288574429009e-06, "loss": 1.1431, "step": 9962 }, { "epoch": 0.3, "learning_rate": 4.102698549490743e-06, "loss": 1.1324, "step": 9963 }, { "epoch": 0.3, "learning_rate": 4.1025113394344795e-06, "loss": 1.1288, "step": 9964 }, { "epoch": 0.3, "learning_rate": 4.102324114123079e-06, "loss": 1.1053, "step": 9965 }, { "epoch": 0.3, "learning_rate": 4.102136873558325e-06, "loss": 1.1105, "step": 9966 }, { "epoch": 0.3, "learning_rate": 4.1019496177419995e-06, "loss": 1.0883, "step": 9967 }, { "epoch": 0.3, "learning_rate": 4.101762346675885e-06, "loss": 1.129, "step": 9968 }, { "epoch": 0.3, "learning_rate": 4.101575060361764e-06, "loss": 1.1165, "step": 9969 }, { "epoch": 0.3, "learning_rate": 4.10138775880142e-06, "loss": 1.0329, "step": 9970 }, { "epoch": 0.3, "learning_rate": 4.101200441996636e-06, "loss": 1.1515, "step": 9971 }, { "epoch": 0.3, "learning_rate": 4.101013109949195e-06, "loss": 1.1216, "step": 9972 }, { "epoch": 0.3, "learning_rate": 4.10082576266088e-06, "loss": 1.0887, "step": 9973 }, { "epoch": 0.3, "learning_rate": 4.100638400133475e-06, "loss": 1.1234, "step": 9974 }, { "epoch": 0.3, "learning_rate": 4.100451022368763e-06, "loss": 1.2047, "step": 9975 }, { "epoch": 0.3, "learning_rate": 4.100263629368528e-06, "loss": 1.1671, "step": 9976 }, { "epoch": 0.3, "learning_rate": 4.1000762211345545e-06, "loss": 1.0895, "step": 9977 }, { "epoch": 0.3, "learning_rate": 4.099888797668626e-06, "loss": 1.0972, "step": 9978 }, { "epoch": 0.3, "learning_rate": 4.099701358972527e-06, "loss": 1.0827, "step": 9979 }, { "epoch": 0.3, "learning_rate": 4.0995139050480406e-06, "loss": 1.0312, "step": 9980 }, { "epoch": 0.3, "learning_rate": 4.099326435896952e-06, "loss": 1.2051, "step": 9981 }, { "epoch": 0.3, "learning_rate": 4.099138951521047e-06, "loss": 1.0886, "step": 9982 }, { "epoch": 0.3, "learning_rate": 4.098951451922108e-06, "loss": 1.069, "step": 9983 }, { "epoch": 0.3, "learning_rate": 4.098763937101923e-06, "loss": 1.1318, "step": 9984 }, { "epoch": 0.3, "learning_rate": 4.0985764070622735e-06, "loss": 1.131, "step": 9985 }, { "epoch": 0.3, "learning_rate": 4.098388861804948e-06, "loss": 1.165, "step": 9986 }, { "epoch": 0.3, "learning_rate": 4.09820130133173e-06, "loss": 1.0767, "step": 9987 }, { "epoch": 0.3, "learning_rate": 4.098013725644405e-06, "loss": 1.2391, "step": 9988 }, { "epoch": 0.3, "learning_rate": 4.097826134744758e-06, "loss": 1.152, "step": 9989 }, { "epoch": 0.3, "learning_rate": 4.097638528634578e-06, "loss": 1.1578, "step": 9990 }, { "epoch": 0.3, "learning_rate": 4.097450907315647e-06, "loss": 1.1172, "step": 9991 }, { "epoch": 0.3, "learning_rate": 4.097263270789753e-06, "loss": 1.1099, "step": 9992 }, { "epoch": 0.3, "learning_rate": 4.097075619058682e-06, "loss": 1.1518, "step": 9993 }, { "epoch": 0.3, "learning_rate": 4.09688795212422e-06, "loss": 1.0294, "step": 9994 }, { "epoch": 0.3, "learning_rate": 4.096700269988154e-06, "loss": 1.0969, "step": 9995 }, { "epoch": 0.3, "learning_rate": 4.096512572652271e-06, "loss": 1.1898, "step": 9996 }, { "epoch": 0.3, "learning_rate": 4.096324860118357e-06, "loss": 1.1284, "step": 9997 }, { "epoch": 0.3, "learning_rate": 4.096137132388199e-06, "loss": 1.1827, "step": 9998 }, { "epoch": 0.3, "learning_rate": 4.095949389463584e-06, "loss": 1.2163, "step": 9999 }, { "epoch": 0.3, "learning_rate": 4.0957616313463e-06, "loss": 1.0914, "step": 10000 }, { "epoch": 0.3, "learning_rate": 4.0955738580381335e-06, "loss": 1.1614, "step": 10001 }, { "epoch": 0.3, "learning_rate": 4.095386069540872e-06, "loss": 1.0653, "step": 10002 }, { "epoch": 0.3, "learning_rate": 4.095198265856304e-06, "loss": 1.1837, "step": 10003 }, { "epoch": 0.3, "learning_rate": 4.095010446986216e-06, "loss": 1.1422, "step": 10004 }, { "epoch": 0.3, "learning_rate": 4.094822612932397e-06, "loss": 1.2029, "step": 10005 }, { "epoch": 0.3, "learning_rate": 4.094634763696635e-06, "loss": 1.1937, "step": 10006 }, { "epoch": 0.3, "learning_rate": 4.094446899280719e-06, "loss": 1.2389, "step": 10007 }, { "epoch": 0.3, "learning_rate": 4.094259019686435e-06, "loss": 1.105, "step": 10008 }, { "epoch": 0.3, "learning_rate": 4.094071124915573e-06, "loss": 1.0355, "step": 10009 }, { "epoch": 0.3, "learning_rate": 4.093883214969922e-06, "loss": 1.0706, "step": 10010 }, { "epoch": 0.3, "learning_rate": 4.093695289851271e-06, "loss": 1.2085, "step": 10011 }, { "epoch": 0.3, "learning_rate": 4.0935073495614085e-06, "loss": 1.3231, "step": 10012 }, { "epoch": 0.3, "learning_rate": 4.093319394102123e-06, "loss": 1.129, "step": 10013 }, { "epoch": 0.3, "learning_rate": 4.093131423475204e-06, "loss": 1.1317, "step": 10014 }, { "epoch": 0.3, "learning_rate": 4.092943437682441e-06, "loss": 1.1503, "step": 10015 }, { "epoch": 0.3, "learning_rate": 4.092755436725624e-06, "loss": 1.1278, "step": 10016 }, { "epoch": 0.3, "learning_rate": 4.092567420606542e-06, "loss": 1.1334, "step": 10017 }, { "epoch": 0.3, "learning_rate": 4.092379389326986e-06, "loss": 1.2568, "step": 10018 }, { "epoch": 0.3, "learning_rate": 4.092191342888745e-06, "loss": 0.9924, "step": 10019 }, { "epoch": 0.3, "learning_rate": 4.092003281293608e-06, "loss": 1.116, "step": 10020 }, { "epoch": 0.3, "learning_rate": 4.091815204543368e-06, "loss": 1.1427, "step": 10021 }, { "epoch": 0.3, "learning_rate": 4.091627112639813e-06, "loss": 1.0361, "step": 10022 }, { "epoch": 0.3, "learning_rate": 4.091439005584735e-06, "loss": 1.1656, "step": 10023 }, { "epoch": 0.3, "learning_rate": 4.091250883379924e-06, "loss": 1.0895, "step": 10024 }, { "epoch": 0.3, "learning_rate": 4.09106274602717e-06, "loss": 1.1416, "step": 10025 }, { "epoch": 0.3, "learning_rate": 4.090874593528265e-06, "loss": 1.1525, "step": 10026 }, { "epoch": 0.3, "learning_rate": 4.090686425885002e-06, "loss": 1.2397, "step": 10027 }, { "epoch": 0.3, "learning_rate": 4.0904982430991695e-06, "loss": 1.0984, "step": 10028 }, { "epoch": 0.3, "learning_rate": 4.090310045172559e-06, "loss": 1.1357, "step": 10029 }, { "epoch": 0.3, "learning_rate": 4.090121832106962e-06, "loss": 1.1328, "step": 10030 }, { "epoch": 0.3, "learning_rate": 4.089933603904173e-06, "loss": 1.074, "step": 10031 }, { "epoch": 0.3, "learning_rate": 4.089745360565981e-06, "loss": 1.1788, "step": 10032 }, { "epoch": 0.3, "learning_rate": 4.0895571020941784e-06, "loss": 1.1847, "step": 10033 }, { "epoch": 0.3, "learning_rate": 4.0893688284905585e-06, "loss": 1.2043, "step": 10034 }, { "epoch": 0.3, "learning_rate": 4.0891805397569124e-06, "loss": 1.1945, "step": 10035 }, { "epoch": 0.3, "learning_rate": 4.088992235895033e-06, "loss": 1.1995, "step": 10036 }, { "epoch": 0.3, "learning_rate": 4.088803916906712e-06, "loss": 1.1744, "step": 10037 }, { "epoch": 0.3, "learning_rate": 4.0886155827937445e-06, "loss": 1.0411, "step": 10038 }, { "epoch": 0.3, "learning_rate": 4.088427233557921e-06, "loss": 1.0939, "step": 10039 }, { "epoch": 0.3, "learning_rate": 4.088238869201035e-06, "loss": 1.1204, "step": 10040 }, { "epoch": 0.3, "learning_rate": 4.08805048972488e-06, "loss": 1.2311, "step": 10041 }, { "epoch": 0.3, "learning_rate": 4.087862095131249e-06, "loss": 1.1502, "step": 10042 }, { "epoch": 0.3, "learning_rate": 4.087673685421936e-06, "loss": 1.1774, "step": 10043 }, { "epoch": 0.3, "learning_rate": 4.087485260598734e-06, "loss": 1.124, "step": 10044 }, { "epoch": 0.3, "learning_rate": 4.0872968206634366e-06, "loss": 1.1833, "step": 10045 }, { "epoch": 0.3, "learning_rate": 4.087108365617838e-06, "loss": 1.1857, "step": 10046 }, { "epoch": 0.3, "learning_rate": 4.086919895463733e-06, "loss": 0.9757, "step": 10047 }, { "epoch": 0.3, "learning_rate": 4.086731410202914e-06, "loss": 1.1901, "step": 10048 }, { "epoch": 0.3, "learning_rate": 4.086542909837176e-06, "loss": 1.1264, "step": 10049 }, { "epoch": 0.3, "learning_rate": 4.086354394368314e-06, "loss": 1.2325, "step": 10050 }, { "epoch": 0.3, "learning_rate": 4.086165863798123e-06, "loss": 1.1382, "step": 10051 }, { "epoch": 0.3, "learning_rate": 4.085977318128395e-06, "loss": 1.0564, "step": 10052 }, { "epoch": 0.3, "learning_rate": 4.085788757360929e-06, "loss": 1.0932, "step": 10053 }, { "epoch": 0.3, "learning_rate": 4.085600181497516e-06, "loss": 1.1896, "step": 10054 }, { "epoch": 0.3, "learning_rate": 4.085411590539954e-06, "loss": 1.1016, "step": 10055 }, { "epoch": 0.3, "learning_rate": 4.085222984490036e-06, "loss": 1.2921, "step": 10056 }, { "epoch": 0.3, "learning_rate": 4.08503436334956e-06, "loss": 1.2048, "step": 10057 }, { "epoch": 0.3, "learning_rate": 4.084845727120319e-06, "loss": 1.1332, "step": 10058 }, { "epoch": 0.3, "learning_rate": 4.0846570758041115e-06, "loss": 1.0916, "step": 10059 }, { "epoch": 0.3, "learning_rate": 4.08446840940273e-06, "loss": 1.2599, "step": 10060 }, { "epoch": 0.3, "learning_rate": 4.0842797279179735e-06, "loss": 1.04, "step": 10061 }, { "epoch": 0.3, "learning_rate": 4.084091031351637e-06, "loss": 1.2423, "step": 10062 }, { "epoch": 0.3, "learning_rate": 4.083902319705517e-06, "loss": 1.1963, "step": 10063 }, { "epoch": 0.3, "learning_rate": 4.0837135929814085e-06, "loss": 1.1412, "step": 10064 }, { "epoch": 0.3, "learning_rate": 4.083524851181111e-06, "loss": 1.197, "step": 10065 }, { "epoch": 0.3, "learning_rate": 4.083336094306419e-06, "loss": 1.215, "step": 10066 }, { "epoch": 0.3, "learning_rate": 4.083147322359129e-06, "loss": 1.0853, "step": 10067 }, { "epoch": 0.3, "learning_rate": 4.08295853534104e-06, "loss": 1.254, "step": 10068 }, { "epoch": 0.3, "learning_rate": 4.082769733253948e-06, "loss": 1.2221, "step": 10069 }, { "epoch": 0.3, "learning_rate": 4.0825809160996495e-06, "loss": 1.1762, "step": 10070 }, { "epoch": 0.3, "learning_rate": 4.082392083879944e-06, "loss": 1.0903, "step": 10071 }, { "epoch": 0.3, "learning_rate": 4.082203236596628e-06, "loss": 1.0743, "step": 10072 }, { "epoch": 0.3, "learning_rate": 4.082014374251498e-06, "loss": 1.2034, "step": 10073 }, { "epoch": 0.3, "learning_rate": 4.081825496846354e-06, "loss": 1.2487, "step": 10074 }, { "epoch": 0.3, "learning_rate": 4.081636604382994e-06, "loss": 1.2573, "step": 10075 }, { "epoch": 0.3, "learning_rate": 4.081447696863214e-06, "loss": 1.1698, "step": 10076 }, { "epoch": 0.3, "learning_rate": 4.081258774288814e-06, "loss": 1.1201, "step": 10077 }, { "epoch": 0.3, "learning_rate": 4.081069836661591e-06, "loss": 1.1195, "step": 10078 }, { "epoch": 0.3, "learning_rate": 4.0808808839833455e-06, "loss": 1.1664, "step": 10079 }, { "epoch": 0.3, "learning_rate": 4.080691916255875e-06, "loss": 1.1678, "step": 10080 }, { "epoch": 0.3, "learning_rate": 4.08050293348098e-06, "loss": 1.0999, "step": 10081 }, { "epoch": 0.3, "learning_rate": 4.080313935660456e-06, "loss": 1.1555, "step": 10082 }, { "epoch": 0.3, "learning_rate": 4.0801249227961065e-06, "loss": 1.1567, "step": 10083 }, { "epoch": 0.3, "learning_rate": 4.079935894889728e-06, "loss": 1.1218, "step": 10084 }, { "epoch": 0.3, "learning_rate": 4.07974685194312e-06, "loss": 1.1613, "step": 10085 }, { "epoch": 0.3, "learning_rate": 4.0795577939580844e-06, "loss": 0.9985, "step": 10086 }, { "epoch": 0.3, "learning_rate": 4.079368720936418e-06, "loss": 1.1166, "step": 10087 }, { "epoch": 0.3, "learning_rate": 4.079179632879923e-06, "loss": 1.1261, "step": 10088 }, { "epoch": 0.3, "learning_rate": 4.078990529790398e-06, "loss": 1.1124, "step": 10089 }, { "epoch": 0.3, "learning_rate": 4.078801411669643e-06, "loss": 1.0189, "step": 10090 }, { "epoch": 0.3, "learning_rate": 4.078612278519459e-06, "loss": 1.1625, "step": 10091 }, { "epoch": 0.3, "learning_rate": 4.078423130341648e-06, "loss": 1.1736, "step": 10092 }, { "epoch": 0.3, "learning_rate": 4.078233967138007e-06, "loss": 1.2054, "step": 10093 }, { "epoch": 0.3, "learning_rate": 4.07804478891034e-06, "loss": 1.163, "step": 10094 }, { "epoch": 0.3, "learning_rate": 4.077855595660446e-06, "loss": 1.1141, "step": 10095 }, { "epoch": 0.3, "learning_rate": 4.077666387390127e-06, "loss": 1.085, "step": 10096 }, { "epoch": 0.3, "learning_rate": 4.077477164101183e-06, "loss": 1.0945, "step": 10097 }, { "epoch": 0.3, "learning_rate": 4.077287925795418e-06, "loss": 1.141, "step": 10098 }, { "epoch": 0.3, "learning_rate": 4.07709867247463e-06, "loss": 1.002, "step": 10099 }, { "epoch": 0.3, "learning_rate": 4.076909404140622e-06, "loss": 1.0905, "step": 10100 }, { "epoch": 0.3, "learning_rate": 4.0767201207951975e-06, "loss": 1.2178, "step": 10101 }, { "epoch": 0.3, "learning_rate": 4.076530822440156e-06, "loss": 1.1934, "step": 10102 }, { "epoch": 0.3, "learning_rate": 4.0763415090773e-06, "loss": 1.0613, "step": 10103 }, { "epoch": 0.3, "learning_rate": 4.076152180708433e-06, "loss": 1.1722, "step": 10104 }, { "epoch": 0.3, "learning_rate": 4.075962837335356e-06, "loss": 1.2038, "step": 10105 }, { "epoch": 0.3, "learning_rate": 4.07577347895987e-06, "loss": 1.305, "step": 10106 }, { "epoch": 0.3, "learning_rate": 4.075584105583782e-06, "loss": 1.1104, "step": 10107 }, { "epoch": 0.3, "learning_rate": 4.07539471720889e-06, "loss": 1.1353, "step": 10108 }, { "epoch": 0.3, "learning_rate": 4.075205313837e-06, "loss": 1.2454, "step": 10109 }, { "epoch": 0.3, "learning_rate": 4.075015895469915e-06, "loss": 1.1125, "step": 10110 }, { "epoch": 0.3, "learning_rate": 4.074826462109436e-06, "loss": 1.1473, "step": 10111 }, { "epoch": 0.3, "learning_rate": 4.074637013757368e-06, "loss": 1.2164, "step": 10112 }, { "epoch": 0.3, "learning_rate": 4.074447550415513e-06, "loss": 1.1144, "step": 10113 }, { "epoch": 0.3, "learning_rate": 4.074258072085677e-06, "loss": 1.0328, "step": 10114 }, { "epoch": 0.3, "learning_rate": 4.074068578769661e-06, "loss": 1.2117, "step": 10115 }, { "epoch": 0.3, "learning_rate": 4.073879070469271e-06, "loss": 1.1312, "step": 10116 }, { "epoch": 0.3, "learning_rate": 4.073689547186311e-06, "loss": 1.0637, "step": 10117 }, { "epoch": 0.3, "learning_rate": 4.073500008922583e-06, "loss": 1.0377, "step": 10118 }, { "epoch": 0.3, "learning_rate": 4.073310455679894e-06, "loss": 1.1194, "step": 10119 }, { "epoch": 0.3, "learning_rate": 4.073120887460047e-06, "loss": 1.1047, "step": 10120 }, { "epoch": 0.3, "learning_rate": 4.072931304264846e-06, "loss": 1.0847, "step": 10121 }, { "epoch": 0.3, "learning_rate": 4.072741706096097e-06, "loss": 1.2738, "step": 10122 }, { "epoch": 0.3, "learning_rate": 4.072552092955604e-06, "loss": 1.1864, "step": 10123 }, { "epoch": 0.3, "learning_rate": 4.072362464845173e-06, "loss": 1.2369, "step": 10124 }, { "epoch": 0.31, "learning_rate": 4.072172821766608e-06, "loss": 1.1143, "step": 10125 }, { "epoch": 0.31, "learning_rate": 4.0719831637217154e-06, "loss": 1.1852, "step": 10126 }, { "epoch": 0.31, "learning_rate": 4.0717934907123e-06, "loss": 1.0833, "step": 10127 }, { "epoch": 0.31, "learning_rate": 4.071603802740168e-06, "loss": 1.1497, "step": 10128 }, { "epoch": 0.31, "learning_rate": 4.071414099807125e-06, "loss": 1.1605, "step": 10129 }, { "epoch": 0.31, "learning_rate": 4.0712243819149755e-06, "loss": 1.098, "step": 10130 }, { "epoch": 0.31, "learning_rate": 4.071034649065528e-06, "loss": 1.122, "step": 10131 }, { "epoch": 0.31, "learning_rate": 4.070844901260586e-06, "loss": 1.1776, "step": 10132 }, { "epoch": 0.31, "learning_rate": 4.070655138501956e-06, "loss": 1.1677, "step": 10133 }, { "epoch": 0.31, "learning_rate": 4.070465360791448e-06, "loss": 1.1572, "step": 10134 }, { "epoch": 0.31, "learning_rate": 4.070275568130865e-06, "loss": 1.1218, "step": 10135 }, { "epoch": 0.31, "learning_rate": 4.070085760522015e-06, "loss": 1.2822, "step": 10136 }, { "epoch": 0.31, "learning_rate": 4.069895937966705e-06, "loss": 1.2728, "step": 10137 }, { "epoch": 0.31, "learning_rate": 4.069706100466741e-06, "loss": 1.0971, "step": 10138 }, { "epoch": 0.31, "learning_rate": 4.0695162480239315e-06, "loss": 1.101, "step": 10139 }, { "epoch": 0.31, "learning_rate": 4.069326380640083e-06, "loss": 1.1124, "step": 10140 }, { "epoch": 0.31, "learning_rate": 4.0691364983170035e-06, "loss": 1.2338, "step": 10141 }, { "epoch": 0.31, "learning_rate": 4.0689466010565006e-06, "loss": 1.1014, "step": 10142 }, { "epoch": 0.31, "learning_rate": 4.06875668886038e-06, "loss": 1.2367, "step": 10143 }, { "epoch": 0.31, "learning_rate": 4.068566761730453e-06, "loss": 1.0699, "step": 10144 }, { "epoch": 0.31, "learning_rate": 4.068376819668525e-06, "loss": 1.1138, "step": 10145 }, { "epoch": 0.31, "learning_rate": 4.068186862676405e-06, "loss": 1.1321, "step": 10146 }, { "epoch": 0.31, "learning_rate": 4.067996890755902e-06, "loss": 1.2275, "step": 10147 }, { "epoch": 0.31, "learning_rate": 4.0678069039088236e-06, "loss": 1.0549, "step": 10148 }, { "epoch": 0.31, "learning_rate": 4.067616902136978e-06, "loss": 1.2181, "step": 10149 }, { "epoch": 0.31, "learning_rate": 4.067426885442175e-06, "loss": 1.0813, "step": 10150 }, { "epoch": 0.31, "learning_rate": 4.067236853826223e-06, "loss": 1.1931, "step": 10151 }, { "epoch": 0.31, "learning_rate": 4.067046807290931e-06, "loss": 1.1769, "step": 10152 }, { "epoch": 0.31, "learning_rate": 4.066856745838107e-06, "loss": 1.2437, "step": 10153 }, { "epoch": 0.31, "learning_rate": 4.0666666694695625e-06, "loss": 1.234, "step": 10154 }, { "epoch": 0.31, "learning_rate": 4.066476578187106e-06, "loss": 1.2228, "step": 10155 }, { "epoch": 0.31, "learning_rate": 4.0662864719925465e-06, "loss": 1.1017, "step": 10156 }, { "epoch": 0.31, "learning_rate": 4.0660963508876935e-06, "loss": 0.9763, "step": 10157 }, { "epoch": 0.31, "learning_rate": 4.065906214874359e-06, "loss": 1.0759, "step": 10158 }, { "epoch": 0.31, "learning_rate": 4.0657160639543506e-06, "loss": 1.1483, "step": 10159 }, { "epoch": 0.31, "learning_rate": 4.065525898129478e-06, "loss": 1.1333, "step": 10160 }, { "epoch": 0.31, "learning_rate": 4.065335717401555e-06, "loss": 1.1536, "step": 10161 }, { "epoch": 0.31, "learning_rate": 4.065145521772389e-06, "loss": 1.1459, "step": 10162 }, { "epoch": 0.31, "learning_rate": 4.064955311243792e-06, "loss": 1.0714, "step": 10163 }, { "epoch": 0.31, "learning_rate": 4.064765085817574e-06, "loss": 1.1463, "step": 10164 }, { "epoch": 0.31, "learning_rate": 4.064574845495545e-06, "loss": 1.0656, "step": 10165 }, { "epoch": 0.31, "learning_rate": 4.064384590279517e-06, "loss": 1.2289, "step": 10166 }, { "epoch": 0.31, "learning_rate": 4.064194320171303e-06, "loss": 1.0198, "step": 10167 }, { "epoch": 0.31, "learning_rate": 4.064004035172711e-06, "loss": 1.1606, "step": 10168 }, { "epoch": 0.31, "learning_rate": 4.063813735285554e-06, "loss": 1.1411, "step": 10169 }, { "epoch": 0.31, "learning_rate": 4.063623420511643e-06, "loss": 1.0795, "step": 10170 }, { "epoch": 0.31, "learning_rate": 4.0634330908527905e-06, "loss": 1.1871, "step": 10171 }, { "epoch": 0.31, "learning_rate": 4.063242746310808e-06, "loss": 1.0734, "step": 10172 }, { "epoch": 0.31, "learning_rate": 4.0630523868875075e-06, "loss": 1.2523, "step": 10173 }, { "epoch": 0.31, "learning_rate": 4.062862012584702e-06, "loss": 1.0998, "step": 10174 }, { "epoch": 0.31, "learning_rate": 4.062671623404201e-06, "loss": 1.1341, "step": 10175 }, { "epoch": 0.31, "learning_rate": 4.06248121934782e-06, "loss": 1.1763, "step": 10176 }, { "epoch": 0.31, "learning_rate": 4.06229080041737e-06, "loss": 1.0812, "step": 10177 }, { "epoch": 0.31, "learning_rate": 4.062100366614664e-06, "loss": 1.1714, "step": 10178 }, { "epoch": 0.31, "learning_rate": 4.061909917941515e-06, "loss": 1.0039, "step": 10179 }, { "epoch": 0.31, "learning_rate": 4.061719454399735e-06, "loss": 1.1827, "step": 10180 }, { "epoch": 0.31, "learning_rate": 4.061528975991138e-06, "loss": 1.2041, "step": 10181 }, { "epoch": 0.31, "learning_rate": 4.0613384827175386e-06, "loss": 1.1453, "step": 10182 }, { "epoch": 0.31, "learning_rate": 4.061147974580748e-06, "loss": 1.0822, "step": 10183 }, { "epoch": 0.31, "learning_rate": 4.0609574515825805e-06, "loss": 1.1788, "step": 10184 }, { "epoch": 0.31, "learning_rate": 4.060766913724849e-06, "loss": 1.1097, "step": 10185 }, { "epoch": 0.31, "learning_rate": 4.06057636100937e-06, "loss": 1.0635, "step": 10186 }, { "epoch": 0.31, "learning_rate": 4.060385793437954e-06, "loss": 1.0522, "step": 10187 }, { "epoch": 0.31, "learning_rate": 4.060195211012418e-06, "loss": 1.1661, "step": 10188 }, { "epoch": 0.31, "learning_rate": 4.060004613734574e-06, "loss": 1.1008, "step": 10189 }, { "epoch": 0.31, "learning_rate": 4.059814001606238e-06, "loss": 1.2606, "step": 10190 }, { "epoch": 0.31, "learning_rate": 4.059623374629224e-06, "loss": 1.116, "step": 10191 }, { "epoch": 0.31, "learning_rate": 4.059432732805346e-06, "loss": 1.1479, "step": 10192 }, { "epoch": 0.31, "learning_rate": 4.0592420761364195e-06, "loss": 1.261, "step": 10193 }, { "epoch": 0.31, "learning_rate": 4.05905140462426e-06, "loss": 1.2662, "step": 10194 }, { "epoch": 0.31, "learning_rate": 4.0588607182706815e-06, "loss": 1.045, "step": 10195 }, { "epoch": 0.31, "learning_rate": 4.0586700170775e-06, "loss": 1.0954, "step": 10196 }, { "epoch": 0.31, "learning_rate": 4.0584793010465304e-06, "loss": 1.2181, "step": 10197 }, { "epoch": 0.31, "learning_rate": 4.058288570179589e-06, "loss": 1.2256, "step": 10198 }, { "epoch": 0.31, "learning_rate": 4.0580978244784905e-06, "loss": 1.2106, "step": 10199 }, { "epoch": 0.31, "learning_rate": 4.057907063945051e-06, "loss": 1.0932, "step": 10200 }, { "epoch": 0.31, "learning_rate": 4.0577162885810865e-06, "loss": 1.1363, "step": 10201 }, { "epoch": 0.31, "learning_rate": 4.057525498388414e-06, "loss": 1.0909, "step": 10202 }, { "epoch": 0.31, "learning_rate": 4.057334693368848e-06, "loss": 1.1407, "step": 10203 }, { "epoch": 0.31, "learning_rate": 4.057143873524206e-06, "loss": 1.2061, "step": 10204 }, { "epoch": 0.31, "learning_rate": 4.056953038856304e-06, "loss": 1.172, "step": 10205 }, { "epoch": 0.31, "learning_rate": 4.056762189366959e-06, "loss": 1.1124, "step": 10206 }, { "epoch": 0.31, "learning_rate": 4.056571325057988e-06, "loss": 1.2313, "step": 10207 }, { "epoch": 0.31, "learning_rate": 4.056380445931208e-06, "loss": 1.0823, "step": 10208 }, { "epoch": 0.31, "learning_rate": 4.056189551988435e-06, "loss": 1.1032, "step": 10209 }, { "epoch": 0.31, "learning_rate": 4.0559986432314865e-06, "loss": 1.109, "step": 10210 }, { "epoch": 0.31, "learning_rate": 4.0558077196621815e-06, "loss": 1.0253, "step": 10211 }, { "epoch": 0.31, "learning_rate": 4.055616781282335e-06, "loss": 1.2036, "step": 10212 }, { "epoch": 0.31, "learning_rate": 4.055425828093768e-06, "loss": 1.12, "step": 10213 }, { "epoch": 0.31, "learning_rate": 4.055234860098295e-06, "loss": 1.1929, "step": 10214 }, { "epoch": 0.31, "learning_rate": 4.0550438772977354e-06, "loss": 1.1744, "step": 10215 }, { "epoch": 0.31, "learning_rate": 4.054852879693906e-06, "loss": 1.1407, "step": 10216 }, { "epoch": 0.31, "learning_rate": 4.0546618672886275e-06, "loss": 1.2477, "step": 10217 }, { "epoch": 0.31, "learning_rate": 4.0544708400837165e-06, "loss": 1.1721, "step": 10218 }, { "epoch": 0.31, "learning_rate": 4.054279798080991e-06, "loss": 1.0205, "step": 10219 }, { "epoch": 0.31, "learning_rate": 4.054088741282271e-06, "loss": 1.1035, "step": 10220 }, { "epoch": 0.31, "learning_rate": 4.053897669689374e-06, "loss": 1.1109, "step": 10221 }, { "epoch": 0.31, "learning_rate": 4.05370658330412e-06, "loss": 1.1222, "step": 10222 }, { "epoch": 0.31, "learning_rate": 4.0535154821283275e-06, "loss": 1.0482, "step": 10223 }, { "epoch": 0.31, "learning_rate": 4.0533243661638165e-06, "loss": 1.2543, "step": 10224 }, { "epoch": 0.31, "learning_rate": 4.053133235412404e-06, "loss": 1.0768, "step": 10225 }, { "epoch": 0.31, "learning_rate": 4.052942089875913e-06, "loss": 1.2316, "step": 10226 }, { "epoch": 0.31, "learning_rate": 4.05275092955616e-06, "loss": 1.1245, "step": 10227 }, { "epoch": 0.31, "learning_rate": 4.052559754454966e-06, "loss": 1.1315, "step": 10228 }, { "epoch": 0.31, "learning_rate": 4.052368564574151e-06, "loss": 1.1902, "step": 10229 }, { "epoch": 0.31, "learning_rate": 4.052177359915536e-06, "loss": 1.1949, "step": 10230 }, { "epoch": 0.31, "learning_rate": 4.051986140480939e-06, "loss": 1.0196, "step": 10231 }, { "epoch": 0.31, "learning_rate": 4.051794906272182e-06, "loss": 1.1765, "step": 10232 }, { "epoch": 0.31, "learning_rate": 4.051603657291084e-06, "loss": 1.0203, "step": 10233 }, { "epoch": 0.31, "learning_rate": 4.051412393539468e-06, "loss": 1.1162, "step": 10234 }, { "epoch": 0.31, "learning_rate": 4.051221115019151e-06, "loss": 1.1208, "step": 10235 }, { "epoch": 0.31, "learning_rate": 4.051029821731958e-06, "loss": 1.1666, "step": 10236 }, { "epoch": 0.31, "learning_rate": 4.050838513679707e-06, "loss": 1.1889, "step": 10237 }, { "epoch": 0.31, "learning_rate": 4.050647190864221e-06, "loss": 1.0987, "step": 10238 }, { "epoch": 0.31, "learning_rate": 4.050455853287321e-06, "loss": 1.0685, "step": 10239 }, { "epoch": 0.31, "learning_rate": 4.050264500950826e-06, "loss": 1.118, "step": 10240 }, { "epoch": 0.31, "learning_rate": 4.0500731338565615e-06, "loss": 1.2034, "step": 10241 }, { "epoch": 0.31, "learning_rate": 4.049881752006346e-06, "loss": 1.1823, "step": 10242 }, { "epoch": 0.31, "learning_rate": 4.049690355402004e-06, "loss": 1.207, "step": 10243 }, { "epoch": 0.31, "learning_rate": 4.049498944045355e-06, "loss": 1.201, "step": 10244 }, { "epoch": 0.31, "learning_rate": 4.049307517938223e-06, "loss": 1.1763, "step": 10245 }, { "epoch": 0.31, "learning_rate": 4.049116077082429e-06, "loss": 1.1572, "step": 10246 }, { "epoch": 0.31, "learning_rate": 4.0489246214797965e-06, "loss": 1.173, "step": 10247 }, { "epoch": 0.31, "learning_rate": 4.048733151132147e-06, "loss": 1.2016, "step": 10248 }, { "epoch": 0.31, "learning_rate": 4.048541666041304e-06, "loss": 1.1501, "step": 10249 }, { "epoch": 0.31, "learning_rate": 4.048350166209091e-06, "loss": 1.1863, "step": 10250 }, { "epoch": 0.31, "learning_rate": 4.048158651637329e-06, "loss": 1.2219, "step": 10251 }, { "epoch": 0.31, "learning_rate": 4.047967122327844e-06, "loss": 1.1171, "step": 10252 }, { "epoch": 0.31, "learning_rate": 4.0477755782824556e-06, "loss": 1.1216, "step": 10253 }, { "epoch": 0.31, "learning_rate": 4.04758401950299e-06, "loss": 1.0707, "step": 10254 }, { "epoch": 0.31, "learning_rate": 4.047392445991269e-06, "loss": 1.0812, "step": 10255 }, { "epoch": 0.31, "learning_rate": 4.0472008577491185e-06, "loss": 1.1754, "step": 10256 }, { "epoch": 0.31, "learning_rate": 4.04700925477836e-06, "loss": 1.2228, "step": 10257 }, { "epoch": 0.31, "learning_rate": 4.046817637080819e-06, "loss": 1.0179, "step": 10258 }, { "epoch": 0.31, "learning_rate": 4.046626004658319e-06, "loss": 1.1217, "step": 10259 }, { "epoch": 0.31, "learning_rate": 4.046434357512684e-06, "loss": 1.1237, "step": 10260 }, { "epoch": 0.31, "learning_rate": 4.046242695645739e-06, "loss": 1.2048, "step": 10261 }, { "epoch": 0.31, "learning_rate": 4.046051019059308e-06, "loss": 1.2523, "step": 10262 }, { "epoch": 0.31, "learning_rate": 4.045859327755216e-06, "loss": 1.2537, "step": 10263 }, { "epoch": 0.31, "learning_rate": 4.045667621735288e-06, "loss": 1.0999, "step": 10264 }, { "epoch": 0.31, "learning_rate": 4.045475901001349e-06, "loss": 1.0597, "step": 10265 }, { "epoch": 0.31, "learning_rate": 4.0452841655552226e-06, "loss": 1.1774, "step": 10266 }, { "epoch": 0.31, "learning_rate": 4.045092415398736e-06, "loss": 1.0837, "step": 10267 }, { "epoch": 0.31, "learning_rate": 4.0449006505337125e-06, "loss": 1.1476, "step": 10268 }, { "epoch": 0.31, "learning_rate": 4.044708870961981e-06, "loss": 1.0966, "step": 10269 }, { "epoch": 0.31, "learning_rate": 4.044517076685364e-06, "loss": 1.1435, "step": 10270 }, { "epoch": 0.31, "learning_rate": 4.0443252677056875e-06, "loss": 1.1859, "step": 10271 }, { "epoch": 0.31, "learning_rate": 4.04413344402478e-06, "loss": 1.0615, "step": 10272 }, { "epoch": 0.31, "learning_rate": 4.043941605644464e-06, "loss": 1.1167, "step": 10273 }, { "epoch": 0.31, "learning_rate": 4.0437497525665685e-06, "loss": 1.1609, "step": 10274 }, { "epoch": 0.31, "learning_rate": 4.043557884792918e-06, "loss": 1.076, "step": 10275 }, { "epoch": 0.31, "learning_rate": 4.0433660023253405e-06, "loss": 1.081, "step": 10276 }, { "epoch": 0.31, "learning_rate": 4.043174105165661e-06, "loss": 1.0626, "step": 10277 }, { "epoch": 0.31, "learning_rate": 4.042982193315709e-06, "loss": 1.1754, "step": 10278 }, { "epoch": 0.31, "learning_rate": 4.042790266777308e-06, "loss": 1.2939, "step": 10279 }, { "epoch": 0.31, "learning_rate": 4.042598325552288e-06, "loss": 1.1716, "step": 10280 }, { "epoch": 0.31, "learning_rate": 4.042406369642475e-06, "loss": 1.1556, "step": 10281 }, { "epoch": 0.31, "learning_rate": 4.042214399049695e-06, "loss": 1.1774, "step": 10282 }, { "epoch": 0.31, "learning_rate": 4.042022413775777e-06, "loss": 1.1431, "step": 10283 }, { "epoch": 0.31, "learning_rate": 4.041830413822549e-06, "loss": 1.092, "step": 10284 }, { "epoch": 0.31, "learning_rate": 4.0416383991918365e-06, "loss": 1.1396, "step": 10285 }, { "epoch": 0.31, "learning_rate": 4.04144636988547e-06, "loss": 1.1299, "step": 10286 }, { "epoch": 0.31, "learning_rate": 4.041254325905277e-06, "loss": 1.2035, "step": 10287 }, { "epoch": 0.31, "learning_rate": 4.041062267253084e-06, "loss": 1.121, "step": 10288 }, { "epoch": 0.31, "learning_rate": 4.04087019393072e-06, "loss": 1.145, "step": 10289 }, { "epoch": 0.31, "learning_rate": 4.040678105940016e-06, "loss": 1.1034, "step": 10290 }, { "epoch": 0.31, "learning_rate": 4.040486003282797e-06, "loss": 1.153, "step": 10291 }, { "epoch": 0.31, "learning_rate": 4.0402938859608935e-06, "loss": 1.1409, "step": 10292 }, { "epoch": 0.31, "learning_rate": 4.040101753976133e-06, "loss": 1.2387, "step": 10293 }, { "epoch": 0.31, "learning_rate": 4.039909607330347e-06, "loss": 1.2274, "step": 10294 }, { "epoch": 0.31, "learning_rate": 4.039717446025363e-06, "loss": 1.1188, "step": 10295 }, { "epoch": 0.31, "learning_rate": 4.0395252700630095e-06, "loss": 1.0495, "step": 10296 }, { "epoch": 0.31, "learning_rate": 4.039333079445118e-06, "loss": 1.1313, "step": 10297 }, { "epoch": 0.31, "learning_rate": 4.039140874173516e-06, "loss": 1.1692, "step": 10298 }, { "epoch": 0.31, "learning_rate": 4.038948654250034e-06, "loss": 1.0314, "step": 10299 }, { "epoch": 0.31, "learning_rate": 4.038756419676503e-06, "loss": 1.0992, "step": 10300 }, { "epoch": 0.31, "learning_rate": 4.038564170454752e-06, "loss": 1.0471, "step": 10301 }, { "epoch": 0.31, "learning_rate": 4.038371906586611e-06, "loss": 1.0923, "step": 10302 }, { "epoch": 0.31, "learning_rate": 4.0381796280739095e-06, "loss": 1.0692, "step": 10303 }, { "epoch": 0.31, "learning_rate": 4.0379873349184795e-06, "loss": 1.1288, "step": 10304 }, { "epoch": 0.31, "learning_rate": 4.03779502712215e-06, "loss": 1.3125, "step": 10305 }, { "epoch": 0.31, "learning_rate": 4.037602704686754e-06, "loss": 1.0709, "step": 10306 }, { "epoch": 0.31, "learning_rate": 4.037410367614119e-06, "loss": 1.1037, "step": 10307 }, { "epoch": 0.31, "learning_rate": 4.0372180159060795e-06, "loss": 1.0377, "step": 10308 }, { "epoch": 0.31, "learning_rate": 4.037025649564463e-06, "loss": 1.1296, "step": 10309 }, { "epoch": 0.31, "learning_rate": 4.036833268591104e-06, "loss": 1.0659, "step": 10310 }, { "epoch": 0.31, "learning_rate": 4.0366408729878315e-06, "loss": 1.2375, "step": 10311 }, { "epoch": 0.31, "learning_rate": 4.036448462756478e-06, "loss": 1.1771, "step": 10312 }, { "epoch": 0.31, "learning_rate": 4.036256037898876e-06, "loss": 1.1844, "step": 10313 }, { "epoch": 0.31, "learning_rate": 4.036063598416856e-06, "loss": 1.1656, "step": 10314 }, { "epoch": 0.31, "learning_rate": 4.03587114431225e-06, "loss": 1.006, "step": 10315 }, { "epoch": 0.31, "learning_rate": 4.0356786755868905e-06, "loss": 1.1232, "step": 10316 }, { "epoch": 0.31, "learning_rate": 4.03548619224261e-06, "loss": 1.1118, "step": 10317 }, { "epoch": 0.31, "learning_rate": 4.03529369428124e-06, "loss": 1.1945, "step": 10318 }, { "epoch": 0.31, "learning_rate": 4.035101181704613e-06, "loss": 1.1266, "step": 10319 }, { "epoch": 0.31, "learning_rate": 4.0349086545145636e-06, "loss": 1.0864, "step": 10320 }, { "epoch": 0.31, "learning_rate": 4.034716112712922e-06, "loss": 1.1467, "step": 10321 }, { "epoch": 0.31, "learning_rate": 4.034523556301523e-06, "loss": 1.1501, "step": 10322 }, { "epoch": 0.31, "learning_rate": 4.034330985282198e-06, "loss": 1.1185, "step": 10323 }, { "epoch": 0.31, "learning_rate": 4.034138399656781e-06, "loss": 1.2042, "step": 10324 }, { "epoch": 0.31, "learning_rate": 4.033945799427105e-06, "loss": 1.1445, "step": 10325 }, { "epoch": 0.31, "learning_rate": 4.033753184595004e-06, "loss": 1.1109, "step": 10326 }, { "epoch": 0.31, "learning_rate": 4.033560555162311e-06, "loss": 1.0106, "step": 10327 }, { "epoch": 0.31, "learning_rate": 4.033367911130862e-06, "loss": 1.1114, "step": 10328 }, { "epoch": 0.31, "learning_rate": 4.033175252502487e-06, "loss": 1.2789, "step": 10329 }, { "epoch": 0.31, "learning_rate": 4.032982579279023e-06, "loss": 1.0266, "step": 10330 }, { "epoch": 0.31, "learning_rate": 4.032789891462302e-06, "loss": 0.9451, "step": 10331 }, { "epoch": 0.31, "learning_rate": 4.032597189054161e-06, "loss": 1.246, "step": 10332 }, { "epoch": 0.31, "learning_rate": 4.032404472056432e-06, "loss": 1.0908, "step": 10333 }, { "epoch": 0.31, "learning_rate": 4.03221174047095e-06, "loss": 1.1401, "step": 10334 }, { "epoch": 0.31, "learning_rate": 4.032018994299551e-06, "loss": 1.0665, "step": 10335 }, { "epoch": 0.31, "learning_rate": 4.0318262335440694e-06, "loss": 1.051, "step": 10336 }, { "epoch": 0.31, "learning_rate": 4.031633458206339e-06, "loss": 1.139, "step": 10337 }, { "epoch": 0.31, "learning_rate": 4.031440668288196e-06, "loss": 1.1265, "step": 10338 }, { "epoch": 0.31, "learning_rate": 4.031247863791475e-06, "loss": 1.1139, "step": 10339 }, { "epoch": 0.31, "learning_rate": 4.031055044718012e-06, "loss": 1.1577, "step": 10340 }, { "epoch": 0.31, "learning_rate": 4.030862211069643e-06, "loss": 1.1646, "step": 10341 }, { "epoch": 0.31, "learning_rate": 4.030669362848202e-06, "loss": 1.158, "step": 10342 }, { "epoch": 0.31, "learning_rate": 4.030476500055527e-06, "loss": 1.2438, "step": 10343 }, { "epoch": 0.31, "learning_rate": 4.030283622693452e-06, "loss": 1.097, "step": 10344 }, { "epoch": 0.31, "learning_rate": 4.0300907307638134e-06, "loss": 1.0731, "step": 10345 }, { "epoch": 0.31, "learning_rate": 4.029897824268449e-06, "loss": 1.1813, "step": 10346 }, { "epoch": 0.31, "learning_rate": 4.029704903209194e-06, "loss": 1.1366, "step": 10347 }, { "epoch": 0.31, "learning_rate": 4.029511967587885e-06, "loss": 1.1295, "step": 10348 }, { "epoch": 0.31, "learning_rate": 4.029319017406359e-06, "loss": 1.1686, "step": 10349 }, { "epoch": 0.31, "learning_rate": 4.029126052666452e-06, "loss": 1.1707, "step": 10350 }, { "epoch": 0.31, "learning_rate": 4.0289330733700015e-06, "loss": 1.2001, "step": 10351 }, { "epoch": 0.31, "learning_rate": 4.028740079518844e-06, "loss": 1.1458, "step": 10352 }, { "epoch": 0.31, "learning_rate": 4.028547071114818e-06, "loss": 1.0965, "step": 10353 }, { "epoch": 0.31, "learning_rate": 4.02835404815976e-06, "loss": 1.177, "step": 10354 }, { "epoch": 0.31, "learning_rate": 4.0281610106555066e-06, "loss": 1.1562, "step": 10355 }, { "epoch": 0.31, "learning_rate": 4.0279679586038975e-06, "loss": 1.1841, "step": 10356 }, { "epoch": 0.31, "learning_rate": 4.027774892006769e-06, "loss": 1.1354, "step": 10357 }, { "epoch": 0.31, "learning_rate": 4.027581810865959e-06, "loss": 1.138, "step": 10358 }, { "epoch": 0.31, "learning_rate": 4.027388715183306e-06, "loss": 1.1128, "step": 10359 }, { "epoch": 0.31, "learning_rate": 4.027195604960649e-06, "loss": 1.0076, "step": 10360 }, { "epoch": 0.31, "learning_rate": 4.027002480199824e-06, "loss": 1.2086, "step": 10361 }, { "epoch": 0.31, "learning_rate": 4.026809340902672e-06, "loss": 1.2316, "step": 10362 }, { "epoch": 0.31, "learning_rate": 4.02661618707103e-06, "loss": 1.2454, "step": 10363 }, { "epoch": 0.31, "learning_rate": 4.026423018706737e-06, "loss": 1.061, "step": 10364 }, { "epoch": 0.31, "learning_rate": 4.026229835811631e-06, "loss": 1.0676, "step": 10365 }, { "epoch": 0.31, "learning_rate": 4.0260366383875525e-06, "loss": 1.0837, "step": 10366 }, { "epoch": 0.31, "learning_rate": 4.025843426436341e-06, "loss": 1.2296, "step": 10367 }, { "epoch": 0.31, "learning_rate": 4.025650199959835e-06, "loss": 1.1958, "step": 10368 }, { "epoch": 0.31, "learning_rate": 4.025456958959874e-06, "loss": 1.0295, "step": 10369 }, { "epoch": 0.31, "learning_rate": 4.025263703438296e-06, "loss": 1.0918, "step": 10370 }, { "epoch": 0.31, "learning_rate": 4.025070433396943e-06, "loss": 1.1219, "step": 10371 }, { "epoch": 0.31, "learning_rate": 4.024877148837654e-06, "loss": 1.0754, "step": 10372 }, { "epoch": 0.31, "learning_rate": 4.024683849762269e-06, "loss": 1.2504, "step": 10373 }, { "epoch": 0.31, "learning_rate": 4.024490536172628e-06, "loss": 1.1631, "step": 10374 }, { "epoch": 0.31, "learning_rate": 4.024297208070571e-06, "loss": 1.1603, "step": 10375 }, { "epoch": 0.31, "learning_rate": 4.024103865457939e-06, "loss": 1.1485, "step": 10376 }, { "epoch": 0.31, "learning_rate": 4.023910508336573e-06, "loss": 1.1053, "step": 10377 }, { "epoch": 0.31, "learning_rate": 4.023717136708311e-06, "loss": 1.1544, "step": 10378 }, { "epoch": 0.31, "learning_rate": 4.023523750574997e-06, "loss": 1.1713, "step": 10379 }, { "epoch": 0.31, "learning_rate": 4.023330349938471e-06, "loss": 1.1049, "step": 10380 }, { "epoch": 0.31, "learning_rate": 4.023136934800573e-06, "loss": 1.1478, "step": 10381 }, { "epoch": 0.31, "learning_rate": 4.022943505163145e-06, "loss": 1.1838, "step": 10382 }, { "epoch": 0.31, "learning_rate": 4.022750061028029e-06, "loss": 1.1557, "step": 10383 }, { "epoch": 0.31, "learning_rate": 4.0225566023970655e-06, "loss": 1.0837, "step": 10384 }, { "epoch": 0.31, "learning_rate": 4.022363129272095e-06, "loss": 1.1329, "step": 10385 }, { "epoch": 0.31, "learning_rate": 4.022169641654963e-06, "loss": 1.1564, "step": 10386 }, { "epoch": 0.31, "learning_rate": 4.021976139547507e-06, "loss": 1.0578, "step": 10387 }, { "epoch": 0.31, "learning_rate": 4.021782622951573e-06, "loss": 1.1483, "step": 10388 }, { "epoch": 0.31, "learning_rate": 4.021589091869e-06, "loss": 1.1927, "step": 10389 }, { "epoch": 0.31, "learning_rate": 4.021395546301633e-06, "loss": 1.1732, "step": 10390 }, { "epoch": 0.31, "learning_rate": 4.021201986251312e-06, "loss": 1.2123, "step": 10391 }, { "epoch": 0.31, "learning_rate": 4.021008411719881e-06, "loss": 1.187, "step": 10392 }, { "epoch": 0.31, "learning_rate": 4.020814822709183e-06, "loss": 1.2204, "step": 10393 }, { "epoch": 0.31, "learning_rate": 4.02062121922106e-06, "loss": 1.1274, "step": 10394 }, { "epoch": 0.31, "learning_rate": 4.020427601257355e-06, "loss": 1.177, "step": 10395 }, { "epoch": 0.31, "learning_rate": 4.020233968819911e-06, "loss": 1.078, "step": 10396 }, { "epoch": 0.31, "learning_rate": 4.020040321910574e-06, "loss": 1.2035, "step": 10397 }, { "epoch": 0.31, "learning_rate": 4.019846660531182e-06, "loss": 1.1465, "step": 10398 }, { "epoch": 0.31, "learning_rate": 4.019652984683584e-06, "loss": 1.1877, "step": 10399 }, { "epoch": 0.31, "learning_rate": 4.019459294369621e-06, "loss": 1.1901, "step": 10400 }, { "epoch": 0.31, "learning_rate": 4.019265589591138e-06, "loss": 1.1504, "step": 10401 }, { "epoch": 0.31, "learning_rate": 4.019071870349977e-06, "loss": 1.1025, "step": 10402 }, { "epoch": 0.31, "learning_rate": 4.0188781366479845e-06, "loss": 1.1677, "step": 10403 }, { "epoch": 0.31, "learning_rate": 4.018684388487003e-06, "loss": 1.1859, "step": 10404 }, { "epoch": 0.31, "learning_rate": 4.018490625868877e-06, "loss": 1.1692, "step": 10405 }, { "epoch": 0.31, "learning_rate": 4.018296848795452e-06, "loss": 1.0898, "step": 10406 }, { "epoch": 0.31, "learning_rate": 4.018103057268573e-06, "loss": 1.1477, "step": 10407 }, { "epoch": 0.31, "learning_rate": 4.017909251290083e-06, "loss": 1.1616, "step": 10408 }, { "epoch": 0.31, "learning_rate": 4.017715430861829e-06, "loss": 1.1425, "step": 10409 }, { "epoch": 0.31, "learning_rate": 4.017521595985655e-06, "loss": 1.1782, "step": 10410 }, { "epoch": 0.31, "learning_rate": 4.017327746663406e-06, "loss": 1.1207, "step": 10411 }, { "epoch": 0.31, "learning_rate": 4.017133882896927e-06, "loss": 1.248, "step": 10412 }, { "epoch": 0.31, "learning_rate": 4.016940004688064e-06, "loss": 1.1887, "step": 10413 }, { "epoch": 0.31, "learning_rate": 4.016746112038664e-06, "loss": 1.1758, "step": 10414 }, { "epoch": 0.31, "learning_rate": 4.0165522049505705e-06, "loss": 1.1321, "step": 10415 }, { "epoch": 0.31, "learning_rate": 4.016358283425631e-06, "loss": 1.1248, "step": 10416 }, { "epoch": 0.31, "learning_rate": 4.01616434746569e-06, "loss": 1.0544, "step": 10417 }, { "epoch": 0.31, "learning_rate": 4.015970397072595e-06, "loss": 1.1318, "step": 10418 }, { "epoch": 0.31, "learning_rate": 4.015776432248193e-06, "loss": 1.1371, "step": 10419 }, { "epoch": 0.31, "learning_rate": 4.015582452994328e-06, "loss": 1.1093, "step": 10420 }, { "epoch": 0.31, "learning_rate": 4.0153884593128485e-06, "loss": 1.1455, "step": 10421 }, { "epoch": 0.31, "learning_rate": 4.0151944512056016e-06, "loss": 1.1174, "step": 10422 }, { "epoch": 0.31, "learning_rate": 4.015000428674433e-06, "loss": 1.1624, "step": 10423 }, { "epoch": 0.31, "learning_rate": 4.0148063917211885e-06, "loss": 1.2302, "step": 10424 }, { "epoch": 0.31, "learning_rate": 4.014612340347718e-06, "loss": 1.2484, "step": 10425 }, { "epoch": 0.31, "learning_rate": 4.014418274555867e-06, "loss": 1.1152, "step": 10426 }, { "epoch": 0.31, "learning_rate": 4.014224194347483e-06, "loss": 1.0928, "step": 10427 }, { "epoch": 0.31, "learning_rate": 4.014030099724415e-06, "loss": 1.1824, "step": 10428 }, { "epoch": 0.31, "learning_rate": 4.013835990688509e-06, "loss": 1.049, "step": 10429 }, { "epoch": 0.31, "learning_rate": 4.013641867241613e-06, "loss": 1.1743, "step": 10430 }, { "epoch": 0.31, "learning_rate": 4.013447729385576e-06, "loss": 1.0594, "step": 10431 }, { "epoch": 0.31, "learning_rate": 4.013253577122246e-06, "loss": 1.1964, "step": 10432 }, { "epoch": 0.31, "learning_rate": 4.01305941045347e-06, "loss": 1.1301, "step": 10433 }, { "epoch": 0.31, "learning_rate": 4.012865229381098e-06, "loss": 1.1731, "step": 10434 }, { "epoch": 0.31, "learning_rate": 4.012671033906977e-06, "loss": 1.0541, "step": 10435 }, { "epoch": 0.31, "learning_rate": 4.012476824032956e-06, "loss": 1.0247, "step": 10436 }, { "epoch": 0.31, "learning_rate": 4.0122825997608835e-06, "loss": 1.2188, "step": 10437 }, { "epoch": 0.31, "learning_rate": 4.01208836109261e-06, "loss": 1.2303, "step": 10438 }, { "epoch": 0.31, "learning_rate": 4.011894108029983e-06, "loss": 1.1035, "step": 10439 }, { "epoch": 0.31, "learning_rate": 4.011699840574853e-06, "loss": 1.1331, "step": 10440 }, { "epoch": 0.31, "learning_rate": 4.011505558729069e-06, "loss": 1.1219, "step": 10441 }, { "epoch": 0.31, "learning_rate": 4.011311262494479e-06, "loss": 1.2502, "step": 10442 }, { "epoch": 0.31, "learning_rate": 4.011116951872933e-06, "loss": 1.1761, "step": 10443 }, { "epoch": 0.31, "learning_rate": 4.010922626866283e-06, "loss": 1.0863, "step": 10444 }, { "epoch": 0.31, "learning_rate": 4.010728287476377e-06, "loss": 1.1627, "step": 10445 }, { "epoch": 0.31, "learning_rate": 4.0105339337050644e-06, "loss": 1.0433, "step": 10446 }, { "epoch": 0.31, "learning_rate": 4.0103395655541965e-06, "loss": 1.0894, "step": 10447 }, { "epoch": 0.31, "learning_rate": 4.010145183025624e-06, "loss": 1.1462, "step": 10448 }, { "epoch": 0.31, "learning_rate": 4.009950786121196e-06, "loss": 1.2529, "step": 10449 }, { "epoch": 0.31, "learning_rate": 4.0097563748427635e-06, "loss": 1.0975, "step": 10450 }, { "epoch": 0.31, "learning_rate": 4.009561949192179e-06, "loss": 1.0382, "step": 10451 }, { "epoch": 0.31, "learning_rate": 4.00936750917129e-06, "loss": 1.1663, "step": 10452 }, { "epoch": 0.31, "learning_rate": 4.00917305478195e-06, "loss": 1.0093, "step": 10453 }, { "epoch": 0.31, "learning_rate": 4.008978586026009e-06, "loss": 1.248, "step": 10454 }, { "epoch": 0.31, "learning_rate": 4.00878410290532e-06, "loss": 1.1777, "step": 10455 }, { "epoch": 0.31, "learning_rate": 4.008589605421731e-06, "loss": 1.145, "step": 10456 }, { "epoch": 0.32, "learning_rate": 4.008395093577097e-06, "loss": 1.1592, "step": 10457 }, { "epoch": 0.32, "learning_rate": 4.008200567373267e-06, "loss": 1.2009, "step": 10458 }, { "epoch": 0.32, "learning_rate": 4.008006026812095e-06, "loss": 1.0914, "step": 10459 }, { "epoch": 0.32, "learning_rate": 4.0078114718954305e-06, "loss": 1.2372, "step": 10460 }, { "epoch": 0.32, "learning_rate": 4.007616902625128e-06, "loss": 1.3004, "step": 10461 }, { "epoch": 0.32, "learning_rate": 4.007422319003039e-06, "loss": 1.248, "step": 10462 }, { "epoch": 0.32, "learning_rate": 4.007227721031015e-06, "loss": 1.0767, "step": 10463 }, { "epoch": 0.32, "learning_rate": 4.007033108710909e-06, "loss": 1.1021, "step": 10464 }, { "epoch": 0.32, "learning_rate": 4.006838482044574e-06, "loss": 1.1082, "step": 10465 }, { "epoch": 0.32, "learning_rate": 4.006643841033862e-06, "loss": 1.1002, "step": 10466 }, { "epoch": 0.32, "learning_rate": 4.006449185680627e-06, "loss": 1.2366, "step": 10467 }, { "epoch": 0.32, "learning_rate": 4.006254515986721e-06, "loss": 1.137, "step": 10468 }, { "epoch": 0.32, "learning_rate": 4.006059831953996e-06, "loss": 1.1829, "step": 10469 }, { "epoch": 0.32, "learning_rate": 4.0058651335843076e-06, "loss": 1.1392, "step": 10470 }, { "epoch": 0.32, "learning_rate": 4.005670420879509e-06, "loss": 1.0908, "step": 10471 }, { "epoch": 0.32, "learning_rate": 4.005475693841453e-06, "loss": 1.1371, "step": 10472 }, { "epoch": 0.32, "learning_rate": 4.005280952471993e-06, "loss": 1.2518, "step": 10473 }, { "epoch": 0.32, "learning_rate": 4.005086196772984e-06, "loss": 1.0688, "step": 10474 }, { "epoch": 0.32, "learning_rate": 4.004891426746279e-06, "loss": 1.1096, "step": 10475 }, { "epoch": 0.32, "learning_rate": 4.004696642393732e-06, "loss": 1.1697, "step": 10476 }, { "epoch": 0.32, "learning_rate": 4.004501843717198e-06, "loss": 1.1443, "step": 10477 }, { "epoch": 0.32, "learning_rate": 4.004307030718531e-06, "loss": 1.1062, "step": 10478 }, { "epoch": 0.32, "learning_rate": 4.004112203399585e-06, "loss": 1.0556, "step": 10479 }, { "epoch": 0.32, "learning_rate": 4.003917361762216e-06, "loss": 1.2336, "step": 10480 }, { "epoch": 0.32, "learning_rate": 4.003722505808277e-06, "loss": 1.1093, "step": 10481 }, { "epoch": 0.32, "learning_rate": 4.0035276355396255e-06, "loss": 1.1203, "step": 10482 }, { "epoch": 0.32, "learning_rate": 4.003332750958114e-06, "loss": 1.0668, "step": 10483 }, { "epoch": 0.32, "learning_rate": 4.003137852065599e-06, "loss": 1.066, "step": 10484 }, { "epoch": 0.32, "learning_rate": 4.0029429388639354e-06, "loss": 1.1964, "step": 10485 }, { "epoch": 0.32, "learning_rate": 4.002748011354979e-06, "loss": 1.1721, "step": 10486 }, { "epoch": 0.32, "learning_rate": 4.002553069540585e-06, "loss": 1.2316, "step": 10487 }, { "epoch": 0.32, "learning_rate": 4.002358113422609e-06, "loss": 1.1347, "step": 10488 }, { "epoch": 0.32, "learning_rate": 4.002163143002909e-06, "loss": 1.0148, "step": 10489 }, { "epoch": 0.32, "learning_rate": 4.001968158283338e-06, "loss": 1.1055, "step": 10490 }, { "epoch": 0.32, "learning_rate": 4.001773159265754e-06, "loss": 1.1696, "step": 10491 }, { "epoch": 0.32, "learning_rate": 4.001578145952013e-06, "loss": 1.2183, "step": 10492 }, { "epoch": 0.32, "learning_rate": 4.001383118343971e-06, "loss": 1.0115, "step": 10493 }, { "epoch": 0.32, "learning_rate": 4.0011880764434856e-06, "loss": 1.0792, "step": 10494 }, { "epoch": 0.32, "learning_rate": 4.000993020252411e-06, "loss": 1.1988, "step": 10495 }, { "epoch": 0.32, "learning_rate": 4.000797949772607e-06, "loss": 1.1319, "step": 10496 }, { "epoch": 0.32, "learning_rate": 4.000602865005928e-06, "loss": 1.1716, "step": 10497 }, { "epoch": 0.32, "learning_rate": 4.000407765954234e-06, "loss": 1.2169, "step": 10498 }, { "epoch": 0.32, "learning_rate": 4.00021265261938e-06, "loss": 1.2073, "step": 10499 }, { "epoch": 0.32, "learning_rate": 4.000017525003224e-06, "loss": 1.1629, "step": 10500 }, { "epoch": 0.32, "learning_rate": 3.999822383107624e-06, "loss": 1.1044, "step": 10501 }, { "epoch": 0.32, "learning_rate": 3.999627226934437e-06, "loss": 1.095, "step": 10502 }, { "epoch": 0.32, "learning_rate": 3.999432056485521e-06, "loss": 1.0811, "step": 10503 }, { "epoch": 0.32, "learning_rate": 3.999236871762734e-06, "loss": 1.2385, "step": 10504 }, { "epoch": 0.32, "learning_rate": 3.999041672767933e-06, "loss": 1.201, "step": 10505 }, { "epoch": 0.32, "learning_rate": 3.998846459502979e-06, "loss": 1.0993, "step": 10506 }, { "epoch": 0.32, "learning_rate": 3.9986512319697275e-06, "loss": 1.1526, "step": 10507 }, { "epoch": 0.32, "learning_rate": 3.998455990170039e-06, "loss": 1.1164, "step": 10508 }, { "epoch": 0.32, "learning_rate": 3.99826073410577e-06, "loss": 1.1324, "step": 10509 }, { "epoch": 0.32, "learning_rate": 3.998065463778781e-06, "loss": 1.1595, "step": 10510 }, { "epoch": 0.32, "learning_rate": 3.99787017919093e-06, "loss": 1.2644, "step": 10511 }, { "epoch": 0.32, "learning_rate": 3.997674880344078e-06, "loss": 1.1653, "step": 10512 }, { "epoch": 0.32, "learning_rate": 3.99747956724008e-06, "loss": 1.0759, "step": 10513 }, { "epoch": 0.32, "learning_rate": 3.997284239880799e-06, "loss": 1.0551, "step": 10514 }, { "epoch": 0.32, "learning_rate": 3.997088898268093e-06, "loss": 1.1052, "step": 10515 }, { "epoch": 0.32, "learning_rate": 3.9968935424038216e-06, "loss": 1.1611, "step": 10516 }, { "epoch": 0.32, "learning_rate": 3.9966981722898444e-06, "loss": 1.0844, "step": 10517 }, { "epoch": 0.32, "learning_rate": 3.996502787928022e-06, "loss": 1.0613, "step": 10518 }, { "epoch": 0.32, "learning_rate": 3.996307389320213e-06, "loss": 1.1053, "step": 10519 }, { "epoch": 0.32, "learning_rate": 3.996111976468279e-06, "loss": 1.2008, "step": 10520 }, { "epoch": 0.32, "learning_rate": 3.995916549374079e-06, "loss": 1.1196, "step": 10521 }, { "epoch": 0.32, "learning_rate": 3.995721108039474e-06, "loss": 1.204, "step": 10522 }, { "epoch": 0.32, "learning_rate": 3.995525652466324e-06, "loss": 1.0634, "step": 10523 }, { "epoch": 0.32, "learning_rate": 3.995330182656491e-06, "loss": 1.1051, "step": 10524 }, { "epoch": 0.32, "learning_rate": 3.995134698611834e-06, "loss": 1.2432, "step": 10525 }, { "epoch": 0.32, "learning_rate": 3.994939200334216e-06, "loss": 1.1157, "step": 10526 }, { "epoch": 0.32, "learning_rate": 3.994743687825496e-06, "loss": 1.0895, "step": 10527 }, { "epoch": 0.32, "learning_rate": 3.994548161087536e-06, "loss": 1.1469, "step": 10528 }, { "epoch": 0.32, "learning_rate": 3.994352620122197e-06, "loss": 1.1069, "step": 10529 }, { "epoch": 0.32, "learning_rate": 3.9941570649313414e-06, "loss": 1.1566, "step": 10530 }, { "epoch": 0.32, "learning_rate": 3.993961495516829e-06, "loss": 1.1917, "step": 10531 }, { "epoch": 0.32, "learning_rate": 3.993765911880524e-06, "loss": 1.1522, "step": 10532 }, { "epoch": 0.32, "learning_rate": 3.993570314024287e-06, "loss": 1.0983, "step": 10533 }, { "epoch": 0.32, "learning_rate": 3.993374701949979e-06, "loss": 1.0328, "step": 10534 }, { "epoch": 0.32, "learning_rate": 3.993179075659463e-06, "loss": 1.084, "step": 10535 }, { "epoch": 0.32, "learning_rate": 3.992983435154602e-06, "loss": 1.1183, "step": 10536 }, { "epoch": 0.32, "learning_rate": 3.992787780437258e-06, "loss": 1.29, "step": 10537 }, { "epoch": 0.32, "learning_rate": 3.9925921115092925e-06, "loss": 1.0511, "step": 10538 }, { "epoch": 0.32, "learning_rate": 3.992396428372569e-06, "loss": 1.1677, "step": 10539 }, { "epoch": 0.32, "learning_rate": 3.992200731028951e-06, "loss": 1.0206, "step": 10540 }, { "epoch": 0.32, "learning_rate": 3.9920050194803e-06, "loss": 1.1812, "step": 10541 }, { "epoch": 0.32, "learning_rate": 3.99180929372848e-06, "loss": 1.1236, "step": 10542 }, { "epoch": 0.32, "learning_rate": 3.991613553775354e-06, "loss": 1.2388, "step": 10543 }, { "epoch": 0.32, "learning_rate": 3.9914177996227855e-06, "loss": 1.2332, "step": 10544 }, { "epoch": 0.32, "learning_rate": 3.991222031272637e-06, "loss": 1.1066, "step": 10545 }, { "epoch": 0.32, "learning_rate": 3.9910262487267745e-06, "loss": 1.1689, "step": 10546 }, { "epoch": 0.32, "learning_rate": 3.990830451987059e-06, "loss": 1.0651, "step": 10547 }, { "epoch": 0.32, "learning_rate": 3.990634641055356e-06, "loss": 1.1478, "step": 10548 }, { "epoch": 0.32, "learning_rate": 3.990438815933529e-06, "loss": 1.1174, "step": 10549 }, { "epoch": 0.32, "learning_rate": 3.990242976623443e-06, "loss": 1.1019, "step": 10550 }, { "epoch": 0.32, "learning_rate": 3.990047123126961e-06, "loss": 1.1611, "step": 10551 }, { "epoch": 0.32, "learning_rate": 3.989851255445948e-06, "loss": 1.1138, "step": 10552 }, { "epoch": 0.32, "learning_rate": 3.989655373582268e-06, "loss": 1.1112, "step": 10553 }, { "epoch": 0.32, "learning_rate": 3.989459477537787e-06, "loss": 1.2566, "step": 10554 }, { "epoch": 0.32, "learning_rate": 3.989263567314369e-06, "loss": 1.1953, "step": 10555 }, { "epoch": 0.32, "learning_rate": 3.989067642913879e-06, "loss": 1.0744, "step": 10556 }, { "epoch": 0.32, "learning_rate": 3.988871704338183e-06, "loss": 1.1869, "step": 10557 }, { "epoch": 0.32, "learning_rate": 3.988675751589145e-06, "loss": 1.0911, "step": 10558 }, { "epoch": 0.32, "learning_rate": 3.98847978466863e-06, "loss": 1.0786, "step": 10559 }, { "epoch": 0.32, "learning_rate": 3.988283803578505e-06, "loss": 1.0482, "step": 10560 }, { "epoch": 0.32, "learning_rate": 3.988087808320635e-06, "loss": 1.1973, "step": 10561 }, { "epoch": 0.32, "learning_rate": 3.9878917988968856e-06, "loss": 1.2367, "step": 10562 }, { "epoch": 0.32, "learning_rate": 3.9876957753091225e-06, "loss": 1.1248, "step": 10563 }, { "epoch": 0.32, "learning_rate": 3.9874997375592126e-06, "loss": 1.0973, "step": 10564 }, { "epoch": 0.32, "learning_rate": 3.987303685649021e-06, "loss": 1.0686, "step": 10565 }, { "epoch": 0.32, "learning_rate": 3.987107619580416e-06, "loss": 1.1152, "step": 10566 }, { "epoch": 0.32, "learning_rate": 3.986911539355261e-06, "loss": 1.203, "step": 10567 }, { "epoch": 0.32, "learning_rate": 3.986715444975426e-06, "loss": 1.1345, "step": 10568 }, { "epoch": 0.32, "learning_rate": 3.986519336442774e-06, "loss": 1.207, "step": 10569 }, { "epoch": 0.32, "learning_rate": 3.986323213759176e-06, "loss": 1.1248, "step": 10570 }, { "epoch": 0.32, "learning_rate": 3.986127076926495e-06, "loss": 1.0522, "step": 10571 }, { "epoch": 0.32, "learning_rate": 3.985930925946601e-06, "loss": 1.0813, "step": 10572 }, { "epoch": 0.32, "learning_rate": 3.985734760821361e-06, "loss": 1.274, "step": 10573 }, { "epoch": 0.32, "learning_rate": 3.98553858155264e-06, "loss": 1.1654, "step": 10574 }, { "epoch": 0.32, "learning_rate": 3.985342388142307e-06, "loss": 1.1221, "step": 10575 }, { "epoch": 0.32, "learning_rate": 3.985146180592231e-06, "loss": 1.2432, "step": 10576 }, { "epoch": 0.32, "learning_rate": 3.984949958904279e-06, "loss": 1.1581, "step": 10577 }, { "epoch": 0.32, "learning_rate": 3.984753723080317e-06, "loss": 1.1391, "step": 10578 }, { "epoch": 0.32, "learning_rate": 3.984557473122216e-06, "loss": 1.0671, "step": 10579 }, { "epoch": 0.32, "learning_rate": 3.984361209031841e-06, "loss": 1.1345, "step": 10580 }, { "epoch": 0.32, "learning_rate": 3.984164930811064e-06, "loss": 1.0135, "step": 10581 }, { "epoch": 0.32, "learning_rate": 3.983968638461752e-06, "loss": 1.1393, "step": 10582 }, { "epoch": 0.32, "learning_rate": 3.983772331985772e-06, "loss": 1.0478, "step": 10583 }, { "epoch": 0.32, "learning_rate": 3.983576011384994e-06, "loss": 1.034, "step": 10584 }, { "epoch": 0.32, "learning_rate": 3.983379676661287e-06, "loss": 1.0715, "step": 10585 }, { "epoch": 0.32, "learning_rate": 3.983183327816521e-06, "loss": 1.1971, "step": 10586 }, { "epoch": 0.32, "learning_rate": 3.982986964852564e-06, "loss": 1.1448, "step": 10587 }, { "epoch": 0.32, "learning_rate": 3.982790587771284e-06, "loss": 1.0583, "step": 10588 }, { "epoch": 0.32, "learning_rate": 3.982594196574552e-06, "loss": 1.1463, "step": 10589 }, { "epoch": 0.32, "learning_rate": 3.982397791264237e-06, "loss": 1.0603, "step": 10590 }, { "epoch": 0.32, "learning_rate": 3.982201371842209e-06, "loss": 1.1745, "step": 10591 }, { "epoch": 0.32, "learning_rate": 3.9820049383103385e-06, "loss": 1.2842, "step": 10592 }, { "epoch": 0.32, "learning_rate": 3.981808490670494e-06, "loss": 1.1752, "step": 10593 }, { "epoch": 0.32, "learning_rate": 3.9816120289245485e-06, "loss": 1.1559, "step": 10594 }, { "epoch": 0.32, "learning_rate": 3.981415553074368e-06, "loss": 1.1476, "step": 10595 }, { "epoch": 0.32, "learning_rate": 3.981219063121825e-06, "loss": 1.2113, "step": 10596 }, { "epoch": 0.32, "learning_rate": 3.98102255906879e-06, "loss": 1.0681, "step": 10597 }, { "epoch": 0.32, "learning_rate": 3.980826040917135e-06, "loss": 1.0986, "step": 10598 }, { "epoch": 0.32, "learning_rate": 3.980629508668728e-06, "loss": 1.0745, "step": 10599 }, { "epoch": 0.32, "learning_rate": 3.980432962325441e-06, "loss": 1.1158, "step": 10600 }, { "epoch": 0.32, "learning_rate": 3.9802364018891456e-06, "loss": 1.099, "step": 10601 }, { "epoch": 0.32, "learning_rate": 3.9800398273617125e-06, "loss": 1.147, "step": 10602 }, { "epoch": 0.32, "learning_rate": 3.979843238745013e-06, "loss": 1.1125, "step": 10603 }, { "epoch": 0.32, "learning_rate": 3.979646636040918e-06, "loss": 1.1595, "step": 10604 }, { "epoch": 0.32, "learning_rate": 3.9794500192513e-06, "loss": 1.0569, "step": 10605 }, { "epoch": 0.32, "learning_rate": 3.97925338837803e-06, "loss": 1.1454, "step": 10606 }, { "epoch": 0.32, "learning_rate": 3.979056743422982e-06, "loss": 1.1347, "step": 10607 }, { "epoch": 0.32, "learning_rate": 3.978860084388025e-06, "loss": 1.1367, "step": 10608 }, { "epoch": 0.32, "learning_rate": 3.978663411275032e-06, "loss": 1.0425, "step": 10609 }, { "epoch": 0.32, "learning_rate": 3.978466724085876e-06, "loss": 1.2788, "step": 10610 }, { "epoch": 0.32, "learning_rate": 3.978270022822428e-06, "loss": 1.1321, "step": 10611 }, { "epoch": 0.32, "learning_rate": 3.978073307486561e-06, "loss": 1.1912, "step": 10612 }, { "epoch": 0.32, "learning_rate": 3.97787657808015e-06, "loss": 1.149, "step": 10613 }, { "epoch": 0.32, "learning_rate": 3.977679834605064e-06, "loss": 1.1643, "step": 10614 }, { "epoch": 0.32, "learning_rate": 3.977483077063178e-06, "loss": 1.1033, "step": 10615 }, { "epoch": 0.32, "learning_rate": 3.977286305456365e-06, "loss": 1.1008, "step": 10616 }, { "epoch": 0.32, "learning_rate": 3.977089519786497e-06, "loss": 1.1292, "step": 10617 }, { "epoch": 0.32, "learning_rate": 3.976892720055448e-06, "loss": 1.1076, "step": 10618 }, { "epoch": 0.32, "learning_rate": 3.976695906265093e-06, "loss": 1.1439, "step": 10619 }, { "epoch": 0.32, "learning_rate": 3.976499078417304e-06, "loss": 1.2174, "step": 10620 }, { "epoch": 0.32, "learning_rate": 3.976302236513955e-06, "loss": 1.0042, "step": 10621 }, { "epoch": 0.32, "learning_rate": 3.976105380556919e-06, "loss": 1.1235, "step": 10622 }, { "epoch": 0.32, "learning_rate": 3.975908510548071e-06, "loss": 1.1158, "step": 10623 }, { "epoch": 0.32, "learning_rate": 3.975711626489285e-06, "loss": 1.2093, "step": 10624 }, { "epoch": 0.32, "learning_rate": 3.975514728382433e-06, "loss": 1.1267, "step": 10625 }, { "epoch": 0.32, "learning_rate": 3.9753178162293944e-06, "loss": 1.066, "step": 10626 }, { "epoch": 0.32, "learning_rate": 3.9751208900320395e-06, "loss": 1.0615, "step": 10627 }, { "epoch": 0.32, "learning_rate": 3.9749239497922445e-06, "loss": 1.0277, "step": 10628 }, { "epoch": 0.32, "learning_rate": 3.974726995511883e-06, "loss": 1.2012, "step": 10629 }, { "epoch": 0.32, "learning_rate": 3.974530027192831e-06, "loss": 1.309, "step": 10630 }, { "epoch": 0.32, "learning_rate": 3.974333044836964e-06, "loss": 1.0936, "step": 10631 }, { "epoch": 0.32, "learning_rate": 3.974136048446155e-06, "loss": 1.1257, "step": 10632 }, { "epoch": 0.32, "learning_rate": 3.9739390380222835e-06, "loss": 1.2662, "step": 10633 }, { "epoch": 0.32, "learning_rate": 3.97374201356722e-06, "loss": 1.123, "step": 10634 }, { "epoch": 0.32, "learning_rate": 3.973544975082843e-06, "loss": 1.1589, "step": 10635 }, { "epoch": 0.32, "learning_rate": 3.973347922571027e-06, "loss": 1.2373, "step": 10636 }, { "epoch": 0.32, "learning_rate": 3.973150856033648e-06, "loss": 1.1257, "step": 10637 }, { "epoch": 0.32, "learning_rate": 3.972953775472584e-06, "loss": 1.1584, "step": 10638 }, { "epoch": 0.32, "learning_rate": 3.972756680889709e-06, "loss": 1.1042, "step": 10639 }, { "epoch": 0.32, "learning_rate": 3.972559572286899e-06, "loss": 1.0947, "step": 10640 }, { "epoch": 0.32, "learning_rate": 3.972362449666031e-06, "loss": 1.0415, "step": 10641 }, { "epoch": 0.32, "learning_rate": 3.972165313028982e-06, "loss": 1.0959, "step": 10642 }, { "epoch": 0.32, "learning_rate": 3.971968162377628e-06, "loss": 1.0414, "step": 10643 }, { "epoch": 0.32, "learning_rate": 3.971770997713847e-06, "loss": 1.1181, "step": 10644 }, { "epoch": 0.32, "learning_rate": 3.9715738190395135e-06, "loss": 1.1152, "step": 10645 }, { "epoch": 0.32, "learning_rate": 3.971376626356507e-06, "loss": 1.1846, "step": 10646 }, { "epoch": 0.32, "learning_rate": 3.971179419666703e-06, "loss": 1.0968, "step": 10647 }, { "epoch": 0.32, "learning_rate": 3.97098219897198e-06, "loss": 1.2258, "step": 10648 }, { "epoch": 0.32, "learning_rate": 3.9707849642742145e-06, "loss": 1.0967, "step": 10649 }, { "epoch": 0.32, "learning_rate": 3.970587715575285e-06, "loss": 1.1, "step": 10650 }, { "epoch": 0.32, "learning_rate": 3.970390452877068e-06, "loss": 1.175, "step": 10651 }, { "epoch": 0.32, "learning_rate": 3.9701931761814424e-06, "loss": 1.0978, "step": 10652 }, { "epoch": 0.32, "learning_rate": 3.969995885490285e-06, "loss": 1.0355, "step": 10653 }, { "epoch": 0.32, "learning_rate": 3.969798580805476e-06, "loss": 1.0957, "step": 10654 }, { "epoch": 0.32, "learning_rate": 3.969601262128892e-06, "loss": 1.2228, "step": 10655 }, { "epoch": 0.32, "learning_rate": 3.969403929462412e-06, "loss": 1.1294, "step": 10656 }, { "epoch": 0.32, "learning_rate": 3.969206582807914e-06, "loss": 1.1888, "step": 10657 }, { "epoch": 0.32, "learning_rate": 3.9690092221672765e-06, "loss": 1.0966, "step": 10658 }, { "epoch": 0.32, "learning_rate": 3.968811847542379e-06, "loss": 1.1292, "step": 10659 }, { "epoch": 0.32, "learning_rate": 3.968614458935101e-06, "loss": 1.0689, "step": 10660 }, { "epoch": 0.32, "learning_rate": 3.96841705634732e-06, "loss": 1.0872, "step": 10661 }, { "epoch": 0.32, "learning_rate": 3.968219639780915e-06, "loss": 1.2256, "step": 10662 }, { "epoch": 0.32, "learning_rate": 3.968022209237768e-06, "loss": 1.3354, "step": 10663 }, { "epoch": 0.32, "learning_rate": 3.967824764719754e-06, "loss": 1.1561, "step": 10664 }, { "epoch": 0.32, "learning_rate": 3.967627306228757e-06, "loss": 1.0381, "step": 10665 }, { "epoch": 0.32, "learning_rate": 3.967429833766655e-06, "loss": 1.0506, "step": 10666 }, { "epoch": 0.32, "learning_rate": 3.967232347335327e-06, "loss": 1.177, "step": 10667 }, { "epoch": 0.32, "learning_rate": 3.967034846936654e-06, "loss": 1.1331, "step": 10668 }, { "epoch": 0.32, "learning_rate": 3.9668373325725165e-06, "loss": 1.359, "step": 10669 }, { "epoch": 0.32, "learning_rate": 3.966639804244793e-06, "loss": 0.9466, "step": 10670 }, { "epoch": 0.32, "learning_rate": 3.966442261955365e-06, "loss": 1.2065, "step": 10671 }, { "epoch": 0.32, "learning_rate": 3.966244705706113e-06, "loss": 1.0777, "step": 10672 }, { "epoch": 0.32, "learning_rate": 3.966047135498917e-06, "loss": 1.0813, "step": 10673 }, { "epoch": 0.32, "learning_rate": 3.96584955133566e-06, "loss": 1.1962, "step": 10674 }, { "epoch": 0.32, "learning_rate": 3.96565195321822e-06, "loss": 1.1246, "step": 10675 }, { "epoch": 0.32, "learning_rate": 3.9654543411484805e-06, "loss": 1.1189, "step": 10676 }, { "epoch": 0.32, "learning_rate": 3.965256715128319e-06, "loss": 1.1422, "step": 10677 }, { "epoch": 0.32, "learning_rate": 3.965059075159622e-06, "loss": 1.1667, "step": 10678 }, { "epoch": 0.32, "learning_rate": 3.964861421244266e-06, "loss": 1.2151, "step": 10679 }, { "epoch": 0.32, "learning_rate": 3.964663753384137e-06, "loss": 1.2306, "step": 10680 }, { "epoch": 0.32, "learning_rate": 3.964466071581113e-06, "loss": 1.1843, "step": 10681 }, { "epoch": 0.32, "learning_rate": 3.964268375837077e-06, "loss": 1.1824, "step": 10682 }, { "epoch": 0.32, "learning_rate": 3.964070666153913e-06, "loss": 1.178, "step": 10683 }, { "epoch": 0.32, "learning_rate": 3.963872942533499e-06, "loss": 1.1252, "step": 10684 }, { "epoch": 0.32, "learning_rate": 3.963675204977722e-06, "loss": 1.1852, "step": 10685 }, { "epoch": 0.32, "learning_rate": 3.96347745348846e-06, "loss": 1.1038, "step": 10686 }, { "epoch": 0.32, "learning_rate": 3.963279688067598e-06, "loss": 1.0657, "step": 10687 }, { "epoch": 0.32, "learning_rate": 3.9630819087170196e-06, "loss": 1.2084, "step": 10688 }, { "epoch": 0.32, "learning_rate": 3.9628841154386045e-06, "loss": 1.0806, "step": 10689 }, { "epoch": 0.32, "learning_rate": 3.962686308234237e-06, "loss": 1.1242, "step": 10690 }, { "epoch": 0.32, "learning_rate": 3.962488487105801e-06, "loss": 1.2128, "step": 10691 }, { "epoch": 0.32, "learning_rate": 3.962290652055179e-06, "loss": 1.2303, "step": 10692 }, { "epoch": 0.32, "learning_rate": 3.962092803084254e-06, "loss": 1.1125, "step": 10693 }, { "epoch": 0.32, "learning_rate": 3.96189494019491e-06, "loss": 1.0852, "step": 10694 }, { "epoch": 0.32, "learning_rate": 3.96169706338903e-06, "loss": 1.2003, "step": 10695 }, { "epoch": 0.32, "learning_rate": 3.961499172668498e-06, "loss": 1.0457, "step": 10696 }, { "epoch": 0.32, "learning_rate": 3.961301268035197e-06, "loss": 1.0368, "step": 10697 }, { "epoch": 0.32, "learning_rate": 3.961103349491013e-06, "loss": 1.0425, "step": 10698 }, { "epoch": 0.32, "learning_rate": 3.960905417037828e-06, "loss": 1.1694, "step": 10699 }, { "epoch": 0.32, "learning_rate": 3.9607074706775275e-06, "loss": 1.0845, "step": 10700 }, { "epoch": 0.32, "learning_rate": 3.960509510411995e-06, "loss": 1.1373, "step": 10701 }, { "epoch": 0.32, "learning_rate": 3.960311536243116e-06, "loss": 1.2296, "step": 10702 }, { "epoch": 0.32, "learning_rate": 3.9601135481727736e-06, "loss": 1.1427, "step": 10703 }, { "epoch": 0.32, "learning_rate": 3.959915546202854e-06, "loss": 1.2384, "step": 10704 }, { "epoch": 0.32, "learning_rate": 3.959717530335241e-06, "loss": 1.1359, "step": 10705 }, { "epoch": 0.32, "learning_rate": 3.959519500571821e-06, "loss": 1.199, "step": 10706 }, { "epoch": 0.32, "learning_rate": 3.959321456914477e-06, "loss": 1.103, "step": 10707 }, { "epoch": 0.32, "learning_rate": 3.959123399365097e-06, "loss": 1.0267, "step": 10708 }, { "epoch": 0.32, "learning_rate": 3.9589253279255635e-06, "loss": 1.2277, "step": 10709 }, { "epoch": 0.32, "learning_rate": 3.958727242597765e-06, "loss": 1.0142, "step": 10710 }, { "epoch": 0.32, "learning_rate": 3.958529143383585e-06, "loss": 1.0508, "step": 10711 }, { "epoch": 0.32, "learning_rate": 3.95833103028491e-06, "loss": 1.2543, "step": 10712 }, { "epoch": 0.32, "learning_rate": 3.958132903303626e-06, "loss": 1.1965, "step": 10713 }, { "epoch": 0.32, "learning_rate": 3.957934762441619e-06, "loss": 1.0305, "step": 10714 }, { "epoch": 0.32, "learning_rate": 3.957736607700775e-06, "loss": 1.0993, "step": 10715 }, { "epoch": 0.32, "learning_rate": 3.9575384390829804e-06, "loss": 1.1095, "step": 10716 }, { "epoch": 0.32, "learning_rate": 3.9573402565901225e-06, "loss": 1.1325, "step": 10717 }, { "epoch": 0.32, "learning_rate": 3.957142060224087e-06, "loss": 1.2188, "step": 10718 }, { "epoch": 0.32, "learning_rate": 3.956943849986761e-06, "loss": 1.1465, "step": 10719 }, { "epoch": 0.32, "learning_rate": 3.95674562588003e-06, "loss": 1.1373, "step": 10720 }, { "epoch": 0.32, "learning_rate": 3.956547387905784e-06, "loss": 1.1838, "step": 10721 }, { "epoch": 0.32, "learning_rate": 3.956349136065908e-06, "loss": 1.1133, "step": 10722 }, { "epoch": 0.32, "learning_rate": 3.956150870362289e-06, "loss": 1.2027, "step": 10723 }, { "epoch": 0.32, "learning_rate": 3.955952590796816e-06, "loss": 1.1536, "step": 10724 }, { "epoch": 0.32, "learning_rate": 3.955754297371374e-06, "loss": 1.1031, "step": 10725 }, { "epoch": 0.32, "learning_rate": 3.955555990087853e-06, "loss": 1.1827, "step": 10726 }, { "epoch": 0.32, "learning_rate": 3.9553576689481395e-06, "loss": 1.2281, "step": 10727 }, { "epoch": 0.32, "learning_rate": 3.955159333954123e-06, "loss": 1.033, "step": 10728 }, { "epoch": 0.32, "learning_rate": 3.95496098510769e-06, "loss": 1.0958, "step": 10729 }, { "epoch": 0.32, "learning_rate": 3.95476262241073e-06, "loss": 1.255, "step": 10730 }, { "epoch": 0.32, "learning_rate": 3.954564245865129e-06, "loss": 0.9637, "step": 10731 }, { "epoch": 0.32, "learning_rate": 3.9543658554727775e-06, "loss": 1.08, "step": 10732 }, { "epoch": 0.32, "learning_rate": 3.954167451235563e-06, "loss": 1.0528, "step": 10733 }, { "epoch": 0.32, "learning_rate": 3.953969033155375e-06, "loss": 1.0516, "step": 10734 }, { "epoch": 0.32, "learning_rate": 3.953770601234103e-06, "loss": 1.1326, "step": 10735 }, { "epoch": 0.32, "learning_rate": 3.953572155473634e-06, "loss": 1.2197, "step": 10736 }, { "epoch": 0.32, "learning_rate": 3.9533736958758584e-06, "loss": 1.0997, "step": 10737 }, { "epoch": 0.32, "learning_rate": 3.953175222442665e-06, "loss": 1.0736, "step": 10738 }, { "epoch": 0.32, "learning_rate": 3.952976735175944e-06, "loss": 1.1959, "step": 10739 }, { "epoch": 0.32, "learning_rate": 3.952778234077583e-06, "loss": 1.1084, "step": 10740 }, { "epoch": 0.32, "learning_rate": 3.952579719149474e-06, "loss": 1.1194, "step": 10741 }, { "epoch": 0.32, "learning_rate": 3.9523811903935055e-06, "loss": 1.0822, "step": 10742 }, { "epoch": 0.32, "learning_rate": 3.952182647811568e-06, "loss": 1.1827, "step": 10743 }, { "epoch": 0.32, "learning_rate": 3.9519840914055505e-06, "loss": 1.1684, "step": 10744 }, { "epoch": 0.32, "learning_rate": 3.951785521177344e-06, "loss": 1.1509, "step": 10745 }, { "epoch": 0.32, "learning_rate": 3.951586937128838e-06, "loss": 1.101, "step": 10746 }, { "epoch": 0.32, "learning_rate": 3.951388339261923e-06, "loss": 1.1688, "step": 10747 }, { "epoch": 0.32, "learning_rate": 3.951189727578491e-06, "loss": 1.1866, "step": 10748 }, { "epoch": 0.32, "learning_rate": 3.950991102080433e-06, "loss": 1.1227, "step": 10749 }, { "epoch": 0.32, "learning_rate": 3.950792462769636e-06, "loss": 1.1068, "step": 10750 }, { "epoch": 0.32, "learning_rate": 3.950593809647994e-06, "loss": 1.0745, "step": 10751 }, { "epoch": 0.32, "learning_rate": 3.950395142717399e-06, "loss": 1.1141, "step": 10752 }, { "epoch": 0.32, "learning_rate": 3.95019646197974e-06, "loss": 1.0352, "step": 10753 }, { "epoch": 0.32, "learning_rate": 3.949997767436908e-06, "loss": 1.1215, "step": 10754 }, { "epoch": 0.32, "learning_rate": 3.949799059090797e-06, "loss": 1.2484, "step": 10755 }, { "epoch": 0.32, "learning_rate": 3.949600336943296e-06, "loss": 1.2727, "step": 10756 }, { "epoch": 0.32, "learning_rate": 3.9494016009963e-06, "loss": 1.0946, "step": 10757 }, { "epoch": 0.32, "learning_rate": 3.949202851251698e-06, "loss": 1.1368, "step": 10758 }, { "epoch": 0.32, "learning_rate": 3.949004087711381e-06, "loss": 1.2011, "step": 10759 }, { "epoch": 0.32, "learning_rate": 3.948805310377245e-06, "loss": 1.1089, "step": 10760 }, { "epoch": 0.32, "learning_rate": 3.948606519251179e-06, "loss": 1.1993, "step": 10761 }, { "epoch": 0.32, "learning_rate": 3.948407714335078e-06, "loss": 1.1795, "step": 10762 }, { "epoch": 0.32, "learning_rate": 3.9482088956308315e-06, "loss": 1.1678, "step": 10763 }, { "epoch": 0.32, "learning_rate": 3.9480100631403355e-06, "loss": 1.2229, "step": 10764 }, { "epoch": 0.32, "learning_rate": 3.947811216865479e-06, "loss": 1.2427, "step": 10765 }, { "epoch": 0.32, "learning_rate": 3.947612356808159e-06, "loss": 1.1741, "step": 10766 }, { "epoch": 0.32, "learning_rate": 3.947413482970265e-06, "loss": 1.181, "step": 10767 }, { "epoch": 0.32, "learning_rate": 3.947214595353694e-06, "loss": 1.1777, "step": 10768 }, { "epoch": 0.32, "learning_rate": 3.947015693960334e-06, "loss": 1.182, "step": 10769 }, { "epoch": 0.32, "learning_rate": 3.946816778792083e-06, "loss": 1.0992, "step": 10770 }, { "epoch": 0.32, "learning_rate": 3.946617849850833e-06, "loss": 1.009, "step": 10771 }, { "epoch": 0.32, "learning_rate": 3.946418907138478e-06, "loss": 1.1152, "step": 10772 }, { "epoch": 0.32, "learning_rate": 3.946219950656912e-06, "loss": 1.1342, "step": 10773 }, { "epoch": 0.32, "learning_rate": 3.946020980408029e-06, "loss": 1.1835, "step": 10774 }, { "epoch": 0.32, "learning_rate": 3.945821996393721e-06, "loss": 1.1877, "step": 10775 }, { "epoch": 0.32, "learning_rate": 3.945622998615884e-06, "loss": 1.1142, "step": 10776 }, { "epoch": 0.32, "learning_rate": 3.945423987076414e-06, "loss": 0.9841, "step": 10777 }, { "epoch": 0.32, "learning_rate": 3.945224961777202e-06, "loss": 1.1286, "step": 10778 }, { "epoch": 0.32, "learning_rate": 3.945025922720145e-06, "loss": 1.0847, "step": 10779 }, { "epoch": 0.32, "learning_rate": 3.944826869907138e-06, "loss": 1.1782, "step": 10780 }, { "epoch": 0.32, "learning_rate": 3.944627803340074e-06, "loss": 1.2266, "step": 10781 }, { "epoch": 0.32, "learning_rate": 3.94442872302085e-06, "loss": 1.1779, "step": 10782 }, { "epoch": 0.32, "learning_rate": 3.944229628951359e-06, "loss": 1.0611, "step": 10783 }, { "epoch": 0.32, "learning_rate": 3.944030521133499e-06, "loss": 1.0989, "step": 10784 }, { "epoch": 0.32, "learning_rate": 3.9438313995691624e-06, "loss": 1.1125, "step": 10785 }, { "epoch": 0.32, "learning_rate": 3.9436322642602474e-06, "loss": 1.1202, "step": 10786 }, { "epoch": 0.32, "learning_rate": 3.943433115208648e-06, "loss": 1.1345, "step": 10787 }, { "epoch": 0.32, "learning_rate": 3.943233952416261e-06, "loss": 1.0759, "step": 10788 }, { "epoch": 0.33, "learning_rate": 3.943034775884981e-06, "loss": 1.1689, "step": 10789 }, { "epoch": 0.33, "learning_rate": 3.942835585616706e-06, "loss": 1.0616, "step": 10790 }, { "epoch": 0.33, "learning_rate": 3.94263638161333e-06, "loss": 1.1753, "step": 10791 }, { "epoch": 0.33, "learning_rate": 3.942437163876751e-06, "loss": 1.0539, "step": 10792 }, { "epoch": 0.33, "learning_rate": 3.942237932408865e-06, "loss": 1.2488, "step": 10793 }, { "epoch": 0.33, "learning_rate": 3.942038687211568e-06, "loss": 1.1293, "step": 10794 }, { "epoch": 0.33, "learning_rate": 3.9418394282867575e-06, "loss": 1.1611, "step": 10795 }, { "epoch": 0.33, "learning_rate": 3.941640155636331e-06, "loss": 1.1161, "step": 10796 }, { "epoch": 0.33, "learning_rate": 3.941440869262183e-06, "loss": 1.2592, "step": 10797 }, { "epoch": 0.33, "learning_rate": 3.941241569166212e-06, "loss": 1.0863, "step": 10798 }, { "epoch": 0.33, "learning_rate": 3.941042255350317e-06, "loss": 1.1343, "step": 10799 }, { "epoch": 0.33, "learning_rate": 3.940842927816393e-06, "loss": 1.327, "step": 10800 }, { "epoch": 0.33, "learning_rate": 3.940643586566338e-06, "loss": 1.1729, "step": 10801 }, { "epoch": 0.33, "learning_rate": 3.9404442316020495e-06, "loss": 1.1735, "step": 10802 }, { "epoch": 0.33, "learning_rate": 3.940244862925427e-06, "loss": 1.0878, "step": 10803 }, { "epoch": 0.33, "learning_rate": 3.940045480538366e-06, "loss": 1.1334, "step": 10804 }, { "epoch": 0.33, "learning_rate": 3.939846084442765e-06, "loss": 1.204, "step": 10805 }, { "epoch": 0.33, "learning_rate": 3.939646674640525e-06, "loss": 1.1739, "step": 10806 }, { "epoch": 0.33, "learning_rate": 3.93944725113354e-06, "loss": 1.1594, "step": 10807 }, { "epoch": 0.33, "learning_rate": 3.9392478139237115e-06, "loss": 1.0867, "step": 10808 }, { "epoch": 0.33, "learning_rate": 3.939048363012936e-06, "loss": 1.1806, "step": 10809 }, { "epoch": 0.33, "learning_rate": 3.938848898403114e-06, "loss": 1.2643, "step": 10810 }, { "epoch": 0.33, "learning_rate": 3.9386494200961425e-06, "loss": 1.1063, "step": 10811 }, { "epoch": 0.33, "learning_rate": 3.9384499280939225e-06, "loss": 1.2484, "step": 10812 }, { "epoch": 0.33, "learning_rate": 3.938250422398351e-06, "loss": 1.0979, "step": 10813 }, { "epoch": 0.33, "learning_rate": 3.938050903011329e-06, "loss": 1.1427, "step": 10814 }, { "epoch": 0.33, "learning_rate": 3.937851369934755e-06, "loss": 1.1973, "step": 10815 }, { "epoch": 0.33, "learning_rate": 3.937651823170528e-06, "loss": 1.0704, "step": 10816 }, { "epoch": 0.33, "learning_rate": 3.937452262720548e-06, "loss": 1.205, "step": 10817 }, { "epoch": 0.33, "learning_rate": 3.937252688586714e-06, "loss": 1.0963, "step": 10818 }, { "epoch": 0.33, "learning_rate": 3.937053100770928e-06, "loss": 1.1598, "step": 10819 }, { "epoch": 0.33, "learning_rate": 3.936853499275089e-06, "loss": 1.1053, "step": 10820 }, { "epoch": 0.33, "learning_rate": 3.936653884101095e-06, "loss": 1.0992, "step": 10821 }, { "epoch": 0.33, "learning_rate": 3.936454255250849e-06, "loss": 0.9929, "step": 10822 }, { "epoch": 0.33, "learning_rate": 3.93625461272625e-06, "loss": 1.2273, "step": 10823 }, { "epoch": 0.33, "learning_rate": 3.936054956529199e-06, "loss": 1.3809, "step": 10824 }, { "epoch": 0.33, "learning_rate": 3.935855286661596e-06, "loss": 1.2554, "step": 10825 }, { "epoch": 0.33, "learning_rate": 3.9356556031253425e-06, "loss": 1.0939, "step": 10826 }, { "epoch": 0.33, "learning_rate": 3.9354559059223396e-06, "loss": 1.1232, "step": 10827 }, { "epoch": 0.33, "learning_rate": 3.935256195054487e-06, "loss": 1.0787, "step": 10828 }, { "epoch": 0.33, "learning_rate": 3.935056470523687e-06, "loss": 1.2544, "step": 10829 }, { "epoch": 0.33, "learning_rate": 3.934856732331841e-06, "loss": 1.0881, "step": 10830 }, { "epoch": 0.33, "learning_rate": 3.934656980480849e-06, "loss": 1.0731, "step": 10831 }, { "epoch": 0.33, "learning_rate": 3.934457214972614e-06, "loss": 0.9772, "step": 10832 }, { "epoch": 0.33, "learning_rate": 3.934257435809037e-06, "loss": 1.1126, "step": 10833 }, { "epoch": 0.33, "learning_rate": 3.934057642992021e-06, "loss": 1.1791, "step": 10834 }, { "epoch": 0.33, "learning_rate": 3.933857836523465e-06, "loss": 1.2272, "step": 10835 }, { "epoch": 0.33, "learning_rate": 3.933658016405274e-06, "loss": 1.1739, "step": 10836 }, { "epoch": 0.33, "learning_rate": 3.93345818263935e-06, "loss": 1.2311, "step": 10837 }, { "epoch": 0.33, "learning_rate": 3.933258335227593e-06, "loss": 1.2527, "step": 10838 }, { "epoch": 0.33, "learning_rate": 3.933058474171908e-06, "loss": 1.0889, "step": 10839 }, { "epoch": 0.33, "learning_rate": 3.9328585994741965e-06, "loss": 1.1902, "step": 10840 }, { "epoch": 0.33, "learning_rate": 3.93265871113636e-06, "loss": 1.0881, "step": 10841 }, { "epoch": 0.33, "learning_rate": 3.9324588091603035e-06, "loss": 1.1936, "step": 10842 }, { "epoch": 0.33, "learning_rate": 3.932258893547929e-06, "loss": 1.1523, "step": 10843 }, { "epoch": 0.33, "learning_rate": 3.932058964301139e-06, "loss": 1.1624, "step": 10844 }, { "epoch": 0.33, "learning_rate": 3.931859021421838e-06, "loss": 1.051, "step": 10845 }, { "epoch": 0.33, "learning_rate": 3.931659064911928e-06, "loss": 1.1912, "step": 10846 }, { "epoch": 0.33, "learning_rate": 3.931459094773314e-06, "loss": 1.1533, "step": 10847 }, { "epoch": 0.33, "learning_rate": 3.931259111007899e-06, "loss": 1.171, "step": 10848 }, { "epoch": 0.33, "learning_rate": 3.931059113617587e-06, "loss": 1.1191, "step": 10849 }, { "epoch": 0.33, "learning_rate": 3.93085910260428e-06, "loss": 1.0244, "step": 10850 }, { "epoch": 0.33, "learning_rate": 3.930659077969884e-06, "loss": 1.1515, "step": 10851 }, { "epoch": 0.33, "learning_rate": 3.930459039716304e-06, "loss": 1.1637, "step": 10852 }, { "epoch": 0.33, "learning_rate": 3.930258987845441e-06, "loss": 1.0787, "step": 10853 }, { "epoch": 0.33, "learning_rate": 3.930058922359202e-06, "loss": 1.1429, "step": 10854 }, { "epoch": 0.33, "learning_rate": 3.929858843259491e-06, "loss": 1.1463, "step": 10855 }, { "epoch": 0.33, "learning_rate": 3.929658750548212e-06, "loss": 1.1321, "step": 10856 }, { "epoch": 0.33, "learning_rate": 3.92945864422727e-06, "loss": 1.1346, "step": 10857 }, { "epoch": 0.33, "learning_rate": 3.92925852429857e-06, "loss": 1.1371, "step": 10858 }, { "epoch": 0.33, "learning_rate": 3.929058390764018e-06, "loss": 1.1436, "step": 10859 }, { "epoch": 0.33, "learning_rate": 3.928858243625519e-06, "loss": 1.1039, "step": 10860 }, { "epoch": 0.33, "learning_rate": 3.928658082884976e-06, "loss": 1.1871, "step": 10861 }, { "epoch": 0.33, "learning_rate": 3.928457908544297e-06, "loss": 1.1142, "step": 10862 }, { "epoch": 0.33, "learning_rate": 3.928257720605387e-06, "loss": 1.2249, "step": 10863 }, { "epoch": 0.33, "learning_rate": 3.928057519070151e-06, "loss": 1.1114, "step": 10864 }, { "epoch": 0.33, "learning_rate": 3.927857303940495e-06, "loss": 1.1273, "step": 10865 }, { "epoch": 0.33, "learning_rate": 3.927657075218326e-06, "loss": 1.1594, "step": 10866 }, { "epoch": 0.33, "learning_rate": 3.927456832905548e-06, "loss": 1.1869, "step": 10867 }, { "epoch": 0.33, "learning_rate": 3.927256577004069e-06, "loss": 1.131, "step": 10868 }, { "epoch": 0.33, "learning_rate": 3.927056307515795e-06, "loss": 1.1384, "step": 10869 }, { "epoch": 0.33, "learning_rate": 3.926856024442632e-06, "loss": 1.093, "step": 10870 }, { "epoch": 0.33, "learning_rate": 3.926655727786487e-06, "loss": 1.0601, "step": 10871 }, { "epoch": 0.33, "learning_rate": 3.926455417549266e-06, "loss": 1.0828, "step": 10872 }, { "epoch": 0.33, "learning_rate": 3.926255093732877e-06, "loss": 1.2162, "step": 10873 }, { "epoch": 0.33, "learning_rate": 3.926054756339226e-06, "loss": 1.2398, "step": 10874 }, { "epoch": 0.33, "learning_rate": 3.925854405370222e-06, "loss": 1.176, "step": 10875 }, { "epoch": 0.33, "learning_rate": 3.9256540408277686e-06, "loss": 1.1324, "step": 10876 }, { "epoch": 0.33, "learning_rate": 3.925453662713777e-06, "loss": 1.1017, "step": 10877 }, { "epoch": 0.33, "learning_rate": 3.925253271030152e-06, "loss": 1.1099, "step": 10878 }, { "epoch": 0.33, "learning_rate": 3.925052865778803e-06, "loss": 1.1559, "step": 10879 }, { "epoch": 0.33, "learning_rate": 3.9248524469616365e-06, "loss": 1.1293, "step": 10880 }, { "epoch": 0.33, "learning_rate": 3.924652014580561e-06, "loss": 1.1293, "step": 10881 }, { "epoch": 0.33, "learning_rate": 3.924451568637485e-06, "loss": 1.0853, "step": 10882 }, { "epoch": 0.33, "learning_rate": 3.924251109134315e-06, "loss": 1.1863, "step": 10883 }, { "epoch": 0.33, "learning_rate": 3.924050636072961e-06, "loss": 1.0093, "step": 10884 }, { "epoch": 0.33, "learning_rate": 3.923850149455332e-06, "loss": 1.0979, "step": 10885 }, { "epoch": 0.33, "learning_rate": 3.923649649283333e-06, "loss": 1.1603, "step": 10886 }, { "epoch": 0.33, "learning_rate": 3.923449135558877e-06, "loss": 1.0992, "step": 10887 }, { "epoch": 0.33, "learning_rate": 3.92324860828387e-06, "loss": 1.1294, "step": 10888 }, { "epoch": 0.33, "learning_rate": 3.923048067460221e-06, "loss": 1.0845, "step": 10889 }, { "epoch": 0.33, "learning_rate": 3.922847513089841e-06, "loss": 1.0802, "step": 10890 }, { "epoch": 0.33, "learning_rate": 3.922646945174638e-06, "loss": 1.0969, "step": 10891 }, { "epoch": 0.33, "learning_rate": 3.922446363716521e-06, "loss": 1.1499, "step": 10892 }, { "epoch": 0.33, "learning_rate": 3.922245768717399e-06, "loss": 1.1916, "step": 10893 }, { "epoch": 0.33, "learning_rate": 3.9220451601791824e-06, "loss": 1.14, "step": 10894 }, { "epoch": 0.33, "learning_rate": 3.921844538103781e-06, "loss": 1.0661, "step": 10895 }, { "epoch": 0.33, "learning_rate": 3.921643902493104e-06, "loss": 1.1312, "step": 10896 }, { "epoch": 0.33, "learning_rate": 3.921443253349063e-06, "loss": 1.1139, "step": 10897 }, { "epoch": 0.33, "learning_rate": 3.921242590673565e-06, "loss": 1.1827, "step": 10898 }, { "epoch": 0.33, "learning_rate": 3.921041914468523e-06, "loss": 1.1291, "step": 10899 }, { "epoch": 0.33, "learning_rate": 3.920841224735847e-06, "loss": 1.1379, "step": 10900 }, { "epoch": 0.33, "learning_rate": 3.9206405214774455e-06, "loss": 1.187, "step": 10901 }, { "epoch": 0.33, "learning_rate": 3.920439804695232e-06, "loss": 1.1955, "step": 10902 }, { "epoch": 0.33, "learning_rate": 3.920239074391114e-06, "loss": 1.0866, "step": 10903 }, { "epoch": 0.33, "learning_rate": 3.920038330567005e-06, "loss": 1.1343, "step": 10904 }, { "epoch": 0.33, "learning_rate": 3.919837573224815e-06, "loss": 1.2744, "step": 10905 }, { "epoch": 0.33, "learning_rate": 3.919636802366454e-06, "loss": 1.0972, "step": 10906 }, { "epoch": 0.33, "learning_rate": 3.919436017993836e-06, "loss": 1.1439, "step": 10907 }, { "epoch": 0.33, "learning_rate": 3.91923522010887e-06, "loss": 1.1313, "step": 10908 }, { "epoch": 0.33, "learning_rate": 3.919034408713468e-06, "loss": 1.1545, "step": 10909 }, { "epoch": 0.33, "learning_rate": 3.9188335838095424e-06, "loss": 1.1577, "step": 10910 }, { "epoch": 0.33, "learning_rate": 3.918632745399004e-06, "loss": 1.1662, "step": 10911 }, { "epoch": 0.33, "learning_rate": 3.918431893483765e-06, "loss": 1.0966, "step": 10912 }, { "epoch": 0.33, "learning_rate": 3.918231028065738e-06, "loss": 1.1461, "step": 10913 }, { "epoch": 0.33, "learning_rate": 3.9180301491468344e-06, "loss": 1.1171, "step": 10914 }, { "epoch": 0.33, "learning_rate": 3.917829256728967e-06, "loss": 1.1773, "step": 10915 }, { "epoch": 0.33, "learning_rate": 3.917628350814048e-06, "loss": 1.1157, "step": 10916 }, { "epoch": 0.33, "learning_rate": 3.917427431403989e-06, "loss": 1.2025, "step": 10917 }, { "epoch": 0.33, "learning_rate": 3.917226498500704e-06, "loss": 1.1644, "step": 10918 }, { "epoch": 0.33, "learning_rate": 3.917025552106105e-06, "loss": 1.0464, "step": 10919 }, { "epoch": 0.33, "learning_rate": 3.916824592222106e-06, "loss": 1.1509, "step": 10920 }, { "epoch": 0.33, "learning_rate": 3.916623618850618e-06, "loss": 1.0831, "step": 10921 }, { "epoch": 0.33, "learning_rate": 3.916422631993557e-06, "loss": 1.1701, "step": 10922 }, { "epoch": 0.33, "learning_rate": 3.916221631652834e-06, "loss": 1.1749, "step": 10923 }, { "epoch": 0.33, "learning_rate": 3.9160206178303625e-06, "loss": 1.2527, "step": 10924 }, { "epoch": 0.33, "learning_rate": 3.915819590528057e-06, "loss": 1.0112, "step": 10925 }, { "epoch": 0.33, "learning_rate": 3.915618549747831e-06, "loss": 1.1169, "step": 10926 }, { "epoch": 0.33, "learning_rate": 3.915417495491599e-06, "loss": 1.1528, "step": 10927 }, { "epoch": 0.33, "learning_rate": 3.915216427761273e-06, "loss": 1.1495, "step": 10928 }, { "epoch": 0.33, "learning_rate": 3.915015346558769e-06, "loss": 1.1658, "step": 10929 }, { "epoch": 0.33, "learning_rate": 3.914814251886e-06, "loss": 1.1148, "step": 10930 }, { "epoch": 0.33, "learning_rate": 3.914613143744881e-06, "loss": 1.2205, "step": 10931 }, { "epoch": 0.33, "learning_rate": 3.914412022137325e-06, "loss": 1.1436, "step": 10932 }, { "epoch": 0.33, "learning_rate": 3.9142108870652494e-06, "loss": 1.0737, "step": 10933 }, { "epoch": 0.33, "learning_rate": 3.914009738530567e-06, "loss": 1.0587, "step": 10934 }, { "epoch": 0.33, "learning_rate": 3.913808576535192e-06, "loss": 1.1332, "step": 10935 }, { "epoch": 0.33, "learning_rate": 3.91360740108104e-06, "loss": 1.0494, "step": 10936 }, { "epoch": 0.33, "learning_rate": 3.913406212170028e-06, "loss": 1.1707, "step": 10937 }, { "epoch": 0.33, "learning_rate": 3.913205009804069e-06, "loss": 1.0434, "step": 10938 }, { "epoch": 0.33, "learning_rate": 3.9130037939850775e-06, "loss": 1.1667, "step": 10939 }, { "epoch": 0.33, "learning_rate": 3.912802564714972e-06, "loss": 1.1873, "step": 10940 }, { "epoch": 0.33, "learning_rate": 3.912601321995666e-06, "loss": 1.1406, "step": 10941 }, { "epoch": 0.33, "learning_rate": 3.9124000658290756e-06, "loss": 1.1585, "step": 10942 }, { "epoch": 0.33, "learning_rate": 3.912198796217117e-06, "loss": 1.1274, "step": 10943 }, { "epoch": 0.33, "learning_rate": 3.911997513161706e-06, "loss": 1.0986, "step": 10944 }, { "epoch": 0.33, "learning_rate": 3.9117962166647585e-06, "loss": 1.1681, "step": 10945 }, { "epoch": 0.33, "learning_rate": 3.911594906728191e-06, "loss": 1.1573, "step": 10946 }, { "epoch": 0.33, "learning_rate": 3.91139358335392e-06, "loss": 1.0529, "step": 10947 }, { "epoch": 0.33, "learning_rate": 3.911192246543862e-06, "loss": 1.1249, "step": 10948 }, { "epoch": 0.33, "learning_rate": 3.910990896299933e-06, "loss": 1.2061, "step": 10949 }, { "epoch": 0.33, "learning_rate": 3.910789532624051e-06, "loss": 1.1498, "step": 10950 }, { "epoch": 0.33, "learning_rate": 3.9105881555181315e-06, "loss": 1.1458, "step": 10951 }, { "epoch": 0.33, "learning_rate": 3.910386764984092e-06, "loss": 1.0166, "step": 10952 }, { "epoch": 0.33, "learning_rate": 3.91018536102385e-06, "loss": 1.0695, "step": 10953 }, { "epoch": 0.33, "learning_rate": 3.909983943639322e-06, "loss": 1.1553, "step": 10954 }, { "epoch": 0.33, "learning_rate": 3.909782512832427e-06, "loss": 1.1011, "step": 10955 }, { "epoch": 0.33, "learning_rate": 3.909581068605081e-06, "loss": 1.0421, "step": 10956 }, { "epoch": 0.33, "learning_rate": 3.909379610959202e-06, "loss": 1.1918, "step": 10957 }, { "epoch": 0.33, "learning_rate": 3.909178139896707e-06, "loss": 1.0906, "step": 10958 }, { "epoch": 0.33, "learning_rate": 3.908976655419517e-06, "loss": 1.1024, "step": 10959 }, { "epoch": 0.33, "learning_rate": 3.908775157529546e-06, "loss": 1.1265, "step": 10960 }, { "epoch": 0.33, "learning_rate": 3.908573646228715e-06, "loss": 1.231, "step": 10961 }, { "epoch": 0.33, "learning_rate": 3.9083721215189395e-06, "loss": 1.1401, "step": 10962 }, { "epoch": 0.33, "learning_rate": 3.908170583402141e-06, "loss": 1.1447, "step": 10963 }, { "epoch": 0.33, "learning_rate": 3.907969031880238e-06, "loss": 1.1812, "step": 10964 }, { "epoch": 0.33, "learning_rate": 3.907767466955146e-06, "loss": 1.1561, "step": 10965 }, { "epoch": 0.33, "learning_rate": 3.907565888628786e-06, "loss": 1.1117, "step": 10966 }, { "epoch": 0.33, "learning_rate": 3.907364296903077e-06, "loss": 1.1886, "step": 10967 }, { "epoch": 0.33, "learning_rate": 3.907162691779938e-06, "loss": 1.1505, "step": 10968 }, { "epoch": 0.33, "learning_rate": 3.906961073261287e-06, "loss": 1.1041, "step": 10969 }, { "epoch": 0.33, "learning_rate": 3.906759441349045e-06, "loss": 1.209, "step": 10970 }, { "epoch": 0.33, "learning_rate": 3.9065577960451306e-06, "loss": 1.1006, "step": 10971 }, { "epoch": 0.33, "learning_rate": 3.906356137351464e-06, "loss": 1.1075, "step": 10972 }, { "epoch": 0.33, "learning_rate": 3.906154465269962e-06, "loss": 1.2614, "step": 10973 }, { "epoch": 0.33, "learning_rate": 3.90595277980255e-06, "loss": 1.1558, "step": 10974 }, { "epoch": 0.33, "learning_rate": 3.905751080951142e-06, "loss": 1.0662, "step": 10975 }, { "epoch": 0.33, "learning_rate": 3.905549368717662e-06, "loss": 1.1572, "step": 10976 }, { "epoch": 0.33, "learning_rate": 3.905347643104028e-06, "loss": 1.1273, "step": 10977 }, { "epoch": 0.33, "learning_rate": 3.905145904112162e-06, "loss": 1.0271, "step": 10978 }, { "epoch": 0.33, "learning_rate": 3.904944151743984e-06, "loss": 1.0955, "step": 10979 }, { "epoch": 0.33, "learning_rate": 3.904742386001413e-06, "loss": 1.1658, "step": 10980 }, { "epoch": 0.33, "learning_rate": 3.904540606886372e-06, "loss": 1.1042, "step": 10981 }, { "epoch": 0.33, "learning_rate": 3.904338814400781e-06, "loss": 1.0578, "step": 10982 }, { "epoch": 0.33, "learning_rate": 3.904137008546562e-06, "loss": 1.2068, "step": 10983 }, { "epoch": 0.33, "learning_rate": 3.903935189325633e-06, "loss": 1.1382, "step": 10984 }, { "epoch": 0.33, "learning_rate": 3.903733356739918e-06, "loss": 1.074, "step": 10985 }, { "epoch": 0.33, "learning_rate": 3.9035315107913364e-06, "loss": 1.0867, "step": 10986 }, { "epoch": 0.33, "learning_rate": 3.903329651481812e-06, "loss": 1.1451, "step": 10987 }, { "epoch": 0.33, "learning_rate": 3.903127778813265e-06, "loss": 1.1182, "step": 10988 }, { "epoch": 0.33, "learning_rate": 3.902925892787617e-06, "loss": 1.1448, "step": 10989 }, { "epoch": 0.33, "learning_rate": 3.902723993406791e-06, "loss": 1.0616, "step": 10990 }, { "epoch": 0.33, "learning_rate": 3.902522080672707e-06, "loss": 1.1281, "step": 10991 }, { "epoch": 0.33, "learning_rate": 3.9023201545872885e-06, "loss": 1.1979, "step": 10992 }, { "epoch": 0.33, "learning_rate": 3.9021182151524574e-06, "loss": 1.1438, "step": 10993 }, { "epoch": 0.33, "learning_rate": 3.901916262370137e-06, "loss": 1.203, "step": 10994 }, { "epoch": 0.33, "learning_rate": 3.9017142962422485e-06, "loss": 1.1408, "step": 10995 }, { "epoch": 0.33, "learning_rate": 3.9015123167707145e-06, "loss": 1.2086, "step": 10996 }, { "epoch": 0.33, "learning_rate": 3.901310323957459e-06, "loss": 1.0483, "step": 10997 }, { "epoch": 0.33, "learning_rate": 3.901108317804404e-06, "loss": 1.0914, "step": 10998 }, { "epoch": 0.33, "learning_rate": 3.9009062983134725e-06, "loss": 1.1232, "step": 10999 }, { "epoch": 0.33, "learning_rate": 3.900704265486588e-06, "loss": 1.114, "step": 11000 }, { "epoch": 0.33, "learning_rate": 3.900502219325672e-06, "loss": 1.1238, "step": 11001 }, { "epoch": 0.33, "learning_rate": 3.900300159832652e-06, "loss": 1.1086, "step": 11002 }, { "epoch": 0.33, "learning_rate": 3.900098087009447e-06, "loss": 1.1058, "step": 11003 }, { "epoch": 0.33, "learning_rate": 3.899896000857982e-06, "loss": 1.0587, "step": 11004 }, { "epoch": 0.33, "learning_rate": 3.899693901380183e-06, "loss": 1.1679, "step": 11005 }, { "epoch": 0.33, "learning_rate": 3.899491788577971e-06, "loss": 1.2256, "step": 11006 }, { "epoch": 0.33, "learning_rate": 3.899289662453272e-06, "loss": 1.118, "step": 11007 }, { "epoch": 0.33, "learning_rate": 3.899087523008008e-06, "loss": 1.1601, "step": 11008 }, { "epoch": 0.33, "learning_rate": 3.8988853702441066e-06, "loss": 1.158, "step": 11009 }, { "epoch": 0.33, "learning_rate": 3.898683204163489e-06, "loss": 1.1161, "step": 11010 }, { "epoch": 0.33, "learning_rate": 3.898481024768082e-06, "loss": 1.0836, "step": 11011 }, { "epoch": 0.33, "learning_rate": 3.898278832059807e-06, "loss": 1.1649, "step": 11012 }, { "epoch": 0.33, "learning_rate": 3.898076626040592e-06, "loss": 1.0999, "step": 11013 }, { "epoch": 0.33, "learning_rate": 3.897874406712362e-06, "loss": 1.0475, "step": 11014 }, { "epoch": 0.33, "learning_rate": 3.897672174077039e-06, "loss": 1.1527, "step": 11015 }, { "epoch": 0.33, "learning_rate": 3.897469928136552e-06, "loss": 1.0234, "step": 11016 }, { "epoch": 0.33, "learning_rate": 3.897267668892823e-06, "loss": 1.1157, "step": 11017 }, { "epoch": 0.33, "learning_rate": 3.897065396347779e-06, "loss": 1.2357, "step": 11018 }, { "epoch": 0.33, "learning_rate": 3.896863110503345e-06, "loss": 1.2197, "step": 11019 }, { "epoch": 0.33, "learning_rate": 3.896660811361448e-06, "loss": 1.1298, "step": 11020 }, { "epoch": 0.33, "learning_rate": 3.896458498924012e-06, "loss": 1.0786, "step": 11021 }, { "epoch": 0.33, "learning_rate": 3.896256173192963e-06, "loss": 1.2079, "step": 11022 }, { "epoch": 0.33, "learning_rate": 3.896053834170228e-06, "loss": 1.1567, "step": 11023 }, { "epoch": 0.33, "learning_rate": 3.895851481857734e-06, "loss": 1.1675, "step": 11024 }, { "epoch": 0.33, "learning_rate": 3.895649116257405e-06, "loss": 1.1482, "step": 11025 }, { "epoch": 0.33, "learning_rate": 3.8954467373711694e-06, "loss": 1.1077, "step": 11026 }, { "epoch": 0.33, "learning_rate": 3.8952443452009524e-06, "loss": 1.1468, "step": 11027 }, { "epoch": 0.33, "learning_rate": 3.895041939748682e-06, "loss": 1.1542, "step": 11028 }, { "epoch": 0.33, "learning_rate": 3.894839521016283e-06, "loss": 1.0548, "step": 11029 }, { "epoch": 0.33, "learning_rate": 3.894637089005684e-06, "loss": 1.2205, "step": 11030 }, { "epoch": 0.33, "learning_rate": 3.8944346437188116e-06, "loss": 1.0577, "step": 11031 }, { "epoch": 0.33, "learning_rate": 3.894232185157592e-06, "loss": 1.0956, "step": 11032 }, { "epoch": 0.33, "learning_rate": 3.894029713323955e-06, "loss": 1.2001, "step": 11033 }, { "epoch": 0.33, "learning_rate": 3.893827228219826e-06, "loss": 1.1174, "step": 11034 }, { "epoch": 0.33, "learning_rate": 3.8936247298471334e-06, "loss": 1.1149, "step": 11035 }, { "epoch": 0.33, "learning_rate": 3.893422218207804e-06, "loss": 1.2144, "step": 11036 }, { "epoch": 0.33, "learning_rate": 3.893219693303767e-06, "loss": 1.1898, "step": 11037 }, { "epoch": 0.33, "learning_rate": 3.893017155136949e-06, "loss": 1.0565, "step": 11038 }, { "epoch": 0.33, "learning_rate": 3.892814603709278e-06, "loss": 1.1891, "step": 11039 }, { "epoch": 0.33, "learning_rate": 3.8926120390226835e-06, "loss": 1.0474, "step": 11040 }, { "epoch": 0.33, "learning_rate": 3.892409461079093e-06, "loss": 1.0369, "step": 11041 }, { "epoch": 0.33, "learning_rate": 3.892206869880435e-06, "loss": 1.1552, "step": 11042 }, { "epoch": 0.33, "learning_rate": 3.8920042654286375e-06, "loss": 1.2449, "step": 11043 }, { "epoch": 0.33, "learning_rate": 3.8918016477256306e-06, "loss": 1.1164, "step": 11044 }, { "epoch": 0.33, "learning_rate": 3.891599016773342e-06, "loss": 1.1534, "step": 11045 }, { "epoch": 0.33, "learning_rate": 3.891396372573701e-06, "loss": 1.0412, "step": 11046 }, { "epoch": 0.33, "learning_rate": 3.891193715128637e-06, "loss": 1.2437, "step": 11047 }, { "epoch": 0.33, "learning_rate": 3.890991044440078e-06, "loss": 1.2574, "step": 11048 }, { "epoch": 0.33, "learning_rate": 3.890788360509955e-06, "loss": 1.3854, "step": 11049 }, { "epoch": 0.33, "learning_rate": 3.890585663340196e-06, "loss": 1.2154, "step": 11050 }, { "epoch": 0.33, "learning_rate": 3.8903829529327316e-06, "loss": 1.1752, "step": 11051 }, { "epoch": 0.33, "learning_rate": 3.890180229289492e-06, "loss": 1.0632, "step": 11052 }, { "epoch": 0.33, "learning_rate": 3.889977492412404e-06, "loss": 1.0321, "step": 11053 }, { "epoch": 0.33, "learning_rate": 3.889774742303402e-06, "loss": 1.0673, "step": 11054 }, { "epoch": 0.33, "learning_rate": 3.889571978964413e-06, "loss": 1.2627, "step": 11055 }, { "epoch": 0.33, "learning_rate": 3.889369202397367e-06, "loss": 1.1893, "step": 11056 }, { "epoch": 0.33, "learning_rate": 3.889166412604196e-06, "loss": 1.1663, "step": 11057 }, { "epoch": 0.33, "learning_rate": 3.88896360958683e-06, "loss": 1.1512, "step": 11058 }, { "epoch": 0.33, "learning_rate": 3.888760793347199e-06, "loss": 1.1716, "step": 11059 }, { "epoch": 0.33, "learning_rate": 3.888557963887235e-06, "loss": 0.9955, "step": 11060 }, { "epoch": 0.33, "learning_rate": 3.888355121208867e-06, "loss": 1.0602, "step": 11061 }, { "epoch": 0.33, "learning_rate": 3.8881522653140276e-06, "loss": 1.1102, "step": 11062 }, { "epoch": 0.33, "learning_rate": 3.887949396204646e-06, "loss": 1.1292, "step": 11063 }, { "epoch": 0.33, "learning_rate": 3.887746513882656e-06, "loss": 1.0889, "step": 11064 }, { "epoch": 0.33, "learning_rate": 3.887543618349987e-06, "loss": 1.14, "step": 11065 }, { "epoch": 0.33, "learning_rate": 3.887340709608571e-06, "loss": 1.1176, "step": 11066 }, { "epoch": 0.33, "learning_rate": 3.88713778766034e-06, "loss": 1.1523, "step": 11067 }, { "epoch": 0.33, "learning_rate": 3.886934852507225e-06, "loss": 1.1685, "step": 11068 }, { "epoch": 0.33, "learning_rate": 3.886731904151157e-06, "loss": 1.0817, "step": 11069 }, { "epoch": 0.33, "learning_rate": 3.886528942594071e-06, "loss": 1.0958, "step": 11070 }, { "epoch": 0.33, "learning_rate": 3.886325967837896e-06, "loss": 1.0826, "step": 11071 }, { "epoch": 0.33, "learning_rate": 3.886122979884566e-06, "loss": 1.1169, "step": 11072 }, { "epoch": 0.33, "learning_rate": 3.885919978736012e-06, "loss": 1.1396, "step": 11073 }, { "epoch": 0.33, "learning_rate": 3.885716964394169e-06, "loss": 1.098, "step": 11074 }, { "epoch": 0.33, "learning_rate": 3.885513936860967e-06, "loss": 0.9636, "step": 11075 }, { "epoch": 0.33, "learning_rate": 3.8853108961383396e-06, "loss": 1.1277, "step": 11076 }, { "epoch": 0.33, "learning_rate": 3.885107842228219e-06, "loss": 1.171, "step": 11077 }, { "epoch": 0.33, "learning_rate": 3.884904775132539e-06, "loss": 1.2609, "step": 11078 }, { "epoch": 0.33, "learning_rate": 3.884701694853233e-06, "loss": 1.1462, "step": 11079 }, { "epoch": 0.33, "learning_rate": 3.884498601392235e-06, "loss": 1.1155, "step": 11080 }, { "epoch": 0.33, "learning_rate": 3.884295494751475e-06, "loss": 1.2321, "step": 11081 }, { "epoch": 0.33, "learning_rate": 3.884092374932889e-06, "loss": 1.119, "step": 11082 }, { "epoch": 0.33, "learning_rate": 3.883889241938411e-06, "loss": 1.1343, "step": 11083 }, { "epoch": 0.33, "learning_rate": 3.883686095769974e-06, "loss": 1.1751, "step": 11084 }, { "epoch": 0.33, "learning_rate": 3.883482936429511e-06, "loss": 1.1277, "step": 11085 }, { "epoch": 0.33, "learning_rate": 3.883279763918957e-06, "loss": 1.2135, "step": 11086 }, { "epoch": 0.33, "learning_rate": 3.883076578240246e-06, "loss": 1.1093, "step": 11087 }, { "epoch": 0.33, "learning_rate": 3.882873379395312e-06, "loss": 1.198, "step": 11088 }, { "epoch": 0.33, "learning_rate": 3.88267016738609e-06, "loss": 1.1031, "step": 11089 }, { "epoch": 0.33, "learning_rate": 3.882466942214513e-06, "loss": 1.1456, "step": 11090 }, { "epoch": 0.33, "learning_rate": 3.882263703882517e-06, "loss": 1.1932, "step": 11091 }, { "epoch": 0.33, "learning_rate": 3.882060452392035e-06, "loss": 1.1139, "step": 11092 }, { "epoch": 0.33, "learning_rate": 3.881857187745006e-06, "loss": 1.1937, "step": 11093 }, { "epoch": 0.33, "learning_rate": 3.88165390994336e-06, "loss": 1.1758, "step": 11094 }, { "epoch": 0.33, "learning_rate": 3.881450618989034e-06, "loss": 1.0729, "step": 11095 }, { "epoch": 0.33, "learning_rate": 3.881247314883964e-06, "loss": 1.2177, "step": 11096 }, { "epoch": 0.33, "learning_rate": 3.881043997630085e-06, "loss": 1.1976, "step": 11097 }, { "epoch": 0.33, "learning_rate": 3.880840667229332e-06, "loss": 1.3033, "step": 11098 }, { "epoch": 0.33, "learning_rate": 3.880637323683641e-06, "loss": 1.23, "step": 11099 }, { "epoch": 0.33, "learning_rate": 3.880433966994948e-06, "loss": 1.1208, "step": 11100 }, { "epoch": 0.33, "learning_rate": 3.880230597165188e-06, "loss": 1.1534, "step": 11101 }, { "epoch": 0.33, "learning_rate": 3.880027214196297e-06, "loss": 1.2073, "step": 11102 }, { "epoch": 0.33, "learning_rate": 3.879823818090213e-06, "loss": 1.2253, "step": 11103 }, { "epoch": 0.33, "learning_rate": 3.879620408848869e-06, "loss": 1.0704, "step": 11104 }, { "epoch": 0.33, "learning_rate": 3.879416986474205e-06, "loss": 1.2636, "step": 11105 }, { "epoch": 0.33, "learning_rate": 3.879213550968154e-06, "loss": 1.0964, "step": 11106 }, { "epoch": 0.33, "learning_rate": 3.8790101023326545e-06, "loss": 1.2516, "step": 11107 }, { "epoch": 0.33, "learning_rate": 3.878806640569644e-06, "loss": 1.1896, "step": 11108 }, { "epoch": 0.33, "learning_rate": 3.878603165681058e-06, "loss": 1.0827, "step": 11109 }, { "epoch": 0.33, "learning_rate": 3.878399677668833e-06, "loss": 1.1724, "step": 11110 }, { "epoch": 0.33, "learning_rate": 3.878196176534907e-06, "loss": 1.1924, "step": 11111 }, { "epoch": 0.33, "learning_rate": 3.877992662281218e-06, "loss": 1.1959, "step": 11112 }, { "epoch": 0.33, "learning_rate": 3.8777891349097025e-06, "loss": 1.1657, "step": 11113 }, { "epoch": 0.33, "learning_rate": 3.877585594422298e-06, "loss": 1.1338, "step": 11114 }, { "epoch": 0.33, "learning_rate": 3.877382040820941e-06, "loss": 1.006, "step": 11115 }, { "epoch": 0.33, "learning_rate": 3.877178474107571e-06, "loss": 1.1519, "step": 11116 }, { "epoch": 0.33, "learning_rate": 3.8769748942841254e-06, "loss": 1.1595, "step": 11117 }, { "epoch": 0.33, "learning_rate": 3.876771301352542e-06, "loss": 1.1678, "step": 11118 }, { "epoch": 0.33, "learning_rate": 3.876567695314759e-06, "loss": 1.1012, "step": 11119 }, { "epoch": 0.33, "learning_rate": 3.876364076172714e-06, "loss": 1.1129, "step": 11120 }, { "epoch": 0.34, "learning_rate": 3.8761604439283464e-06, "loss": 1.1086, "step": 11121 }, { "epoch": 0.34, "learning_rate": 3.875956798583595e-06, "loss": 1.1697, "step": 11122 }, { "epoch": 0.34, "learning_rate": 3.875753140140395e-06, "loss": 1.2659, "step": 11123 }, { "epoch": 0.34, "learning_rate": 3.87554946860069e-06, "loss": 1.1304, "step": 11124 }, { "epoch": 0.34, "learning_rate": 3.875345783966415e-06, "loss": 1.2584, "step": 11125 }, { "epoch": 0.34, "learning_rate": 3.875142086239512e-06, "loss": 1.1909, "step": 11126 }, { "epoch": 0.34, "learning_rate": 3.874938375421917e-06, "loss": 1.0729, "step": 11127 }, { "epoch": 0.34, "learning_rate": 3.874734651515573e-06, "loss": 1.1367, "step": 11128 }, { "epoch": 0.34, "learning_rate": 3.874530914522415e-06, "loss": 1.1304, "step": 11129 }, { "epoch": 0.34, "learning_rate": 3.874327164444386e-06, "loss": 1.2164, "step": 11130 }, { "epoch": 0.34, "learning_rate": 3.8741234012834235e-06, "loss": 1.0798, "step": 11131 }, { "epoch": 0.34, "learning_rate": 3.873919625041469e-06, "loss": 1.1581, "step": 11132 }, { "epoch": 0.34, "learning_rate": 3.873715835720461e-06, "loss": 1.0808, "step": 11133 }, { "epoch": 0.34, "learning_rate": 3.8735120333223394e-06, "loss": 1.1143, "step": 11134 }, { "epoch": 0.34, "learning_rate": 3.873308217849045e-06, "loss": 1.1831, "step": 11135 }, { "epoch": 0.34, "learning_rate": 3.873104389302518e-06, "loss": 1.1085, "step": 11136 }, { "epoch": 0.34, "learning_rate": 3.8729005476846984e-06, "loss": 1.149, "step": 11137 }, { "epoch": 0.34, "learning_rate": 3.872696692997527e-06, "loss": 1.173, "step": 11138 }, { "epoch": 0.34, "learning_rate": 3.872492825242944e-06, "loss": 1.1536, "step": 11139 }, { "epoch": 0.34, "learning_rate": 3.8722889444228896e-06, "loss": 1.0258, "step": 11140 }, { "epoch": 0.34, "learning_rate": 3.872085050539306e-06, "loss": 1.1061, "step": 11141 }, { "epoch": 0.34, "learning_rate": 3.8718811435941335e-06, "loss": 1.1635, "step": 11142 }, { "epoch": 0.34, "learning_rate": 3.871677223589313e-06, "loss": 1.0493, "step": 11143 }, { "epoch": 0.34, "learning_rate": 3.871473290526786e-06, "loss": 1.1886, "step": 11144 }, { "epoch": 0.34, "learning_rate": 3.871269344408495e-06, "loss": 1.2083, "step": 11145 }, { "epoch": 0.34, "learning_rate": 3.871065385236379e-06, "loss": 1.092, "step": 11146 }, { "epoch": 0.34, "learning_rate": 3.870861413012381e-06, "loss": 1.2134, "step": 11147 }, { "epoch": 0.34, "learning_rate": 3.870657427738443e-06, "loss": 1.1082, "step": 11148 }, { "epoch": 0.34, "learning_rate": 3.8704534294165056e-06, "loss": 1.2043, "step": 11149 }, { "epoch": 0.34, "learning_rate": 3.870249418048513e-06, "loss": 1.2813, "step": 11150 }, { "epoch": 0.34, "learning_rate": 3.870045393636405e-06, "loss": 1.1649, "step": 11151 }, { "epoch": 0.34, "learning_rate": 3.869841356182124e-06, "loss": 1.0992, "step": 11152 }, { "epoch": 0.34, "learning_rate": 3.869637305687613e-06, "loss": 1.1323, "step": 11153 }, { "epoch": 0.34, "learning_rate": 3.869433242154816e-06, "loss": 1.1558, "step": 11154 }, { "epoch": 0.34, "learning_rate": 3.869229165585673e-06, "loss": 1.2104, "step": 11155 }, { "epoch": 0.34, "learning_rate": 3.869025075982129e-06, "loss": 1.2797, "step": 11156 }, { "epoch": 0.34, "learning_rate": 3.868820973346125e-06, "loss": 1.0873, "step": 11157 }, { "epoch": 0.34, "learning_rate": 3.8686168576796035e-06, "loss": 1.1499, "step": 11158 }, { "epoch": 0.34, "learning_rate": 3.8684127289845095e-06, "loss": 0.9794, "step": 11159 }, { "epoch": 0.34, "learning_rate": 3.868208587262785e-06, "loss": 1.2089, "step": 11160 }, { "epoch": 0.34, "learning_rate": 3.868004432516374e-06, "loss": 1.2061, "step": 11161 }, { "epoch": 0.34, "learning_rate": 3.86780026474722e-06, "loss": 1.088, "step": 11162 }, { "epoch": 0.34, "learning_rate": 3.867596083957265e-06, "loss": 1.2578, "step": 11163 }, { "epoch": 0.34, "learning_rate": 3.867391890148456e-06, "loss": 1.1431, "step": 11164 }, { "epoch": 0.34, "learning_rate": 3.8671876833227334e-06, "loss": 1.1693, "step": 11165 }, { "epoch": 0.34, "learning_rate": 3.8669834634820425e-06, "loss": 1.1223, "step": 11166 }, { "epoch": 0.34, "learning_rate": 3.8667792306283284e-06, "loss": 1.1407, "step": 11167 }, { "epoch": 0.34, "learning_rate": 3.866574984763533e-06, "loss": 1.0974, "step": 11168 }, { "epoch": 0.34, "learning_rate": 3.866370725889602e-06, "loss": 1.2025, "step": 11169 }, { "epoch": 0.34, "learning_rate": 3.8661664540084805e-06, "loss": 1.1761, "step": 11170 }, { "epoch": 0.34, "learning_rate": 3.865962169122112e-06, "loss": 1.0724, "step": 11171 }, { "epoch": 0.34, "learning_rate": 3.865757871232442e-06, "loss": 1.1078, "step": 11172 }, { "epoch": 0.34, "learning_rate": 3.865553560341414e-06, "loss": 1.2868, "step": 11173 }, { "epoch": 0.34, "learning_rate": 3.8653492364509734e-06, "loss": 1.2222, "step": 11174 }, { "epoch": 0.34, "learning_rate": 3.865144899563067e-06, "loss": 1.1703, "step": 11175 }, { "epoch": 0.34, "learning_rate": 3.864940549679638e-06, "loss": 1.2722, "step": 11176 }, { "epoch": 0.34, "learning_rate": 3.8647361868026325e-06, "loss": 1.1239, "step": 11177 }, { "epoch": 0.34, "learning_rate": 3.864531810933996e-06, "loss": 1.0914, "step": 11178 }, { "epoch": 0.34, "learning_rate": 3.864327422075673e-06, "loss": 1.1594, "step": 11179 }, { "epoch": 0.34, "learning_rate": 3.86412302022961e-06, "loss": 1.2015, "step": 11180 }, { "epoch": 0.34, "learning_rate": 3.863918605397754e-06, "loss": 1.2806, "step": 11181 }, { "epoch": 0.34, "learning_rate": 3.863714177582049e-06, "loss": 1.143, "step": 11182 }, { "epoch": 0.34, "learning_rate": 3.863509736784442e-06, "loss": 1.1278, "step": 11183 }, { "epoch": 0.34, "learning_rate": 3.8633052830068785e-06, "loss": 1.1697, "step": 11184 }, { "epoch": 0.34, "learning_rate": 3.863100816251306e-06, "loss": 1.0391, "step": 11185 }, { "epoch": 0.34, "learning_rate": 3.86289633651967e-06, "loss": 1.1892, "step": 11186 }, { "epoch": 0.34, "learning_rate": 3.862691843813917e-06, "loss": 1.2084, "step": 11187 }, { "epoch": 0.34, "learning_rate": 3.862487338135994e-06, "loss": 1.1029, "step": 11188 }, { "epoch": 0.34, "learning_rate": 3.8622828194878485e-06, "loss": 1.1786, "step": 11189 }, { "epoch": 0.34, "learning_rate": 3.862078287871426e-06, "loss": 1.0912, "step": 11190 }, { "epoch": 0.34, "learning_rate": 3.8618737432886735e-06, "loss": 1.0148, "step": 11191 }, { "epoch": 0.34, "learning_rate": 3.86166918574154e-06, "loss": 1.1644, "step": 11192 }, { "epoch": 0.34, "learning_rate": 3.861464615231971e-06, "loss": 1.1587, "step": 11193 }, { "epoch": 0.34, "learning_rate": 3.861260031761915e-06, "loss": 1.0422, "step": 11194 }, { "epoch": 0.34, "learning_rate": 3.861055435333319e-06, "loss": 1.2136, "step": 11195 }, { "epoch": 0.34, "learning_rate": 3.86085082594813e-06, "loss": 1.0133, "step": 11196 }, { "epoch": 0.34, "learning_rate": 3.860646203608298e-06, "loss": 1.0901, "step": 11197 }, { "epoch": 0.34, "learning_rate": 3.860441568315768e-06, "loss": 1.2172, "step": 11198 }, { "epoch": 0.34, "learning_rate": 3.860236920072491e-06, "loss": 1.1205, "step": 11199 }, { "epoch": 0.34, "learning_rate": 3.860032258880412e-06, "loss": 1.0571, "step": 11200 }, { "epoch": 0.34, "learning_rate": 3.8598275847414825e-06, "loss": 1.0859, "step": 11201 }, { "epoch": 0.34, "learning_rate": 3.859622897657648e-06, "loss": 1.0491, "step": 11202 }, { "epoch": 0.34, "learning_rate": 3.859418197630859e-06, "loss": 1.1083, "step": 11203 }, { "epoch": 0.34, "learning_rate": 3.859213484663064e-06, "loss": 1.0957, "step": 11204 }, { "epoch": 0.34, "learning_rate": 3.8590087587562094e-06, "loss": 1.1376, "step": 11205 }, { "epoch": 0.34, "learning_rate": 3.858804019912248e-06, "loss": 1.2523, "step": 11206 }, { "epoch": 0.34, "learning_rate": 3.858599268133125e-06, "loss": 1.2045, "step": 11207 }, { "epoch": 0.34, "learning_rate": 3.858394503420793e-06, "loss": 1.1159, "step": 11208 }, { "epoch": 0.34, "learning_rate": 3.858189725777198e-06, "loss": 1.1911, "step": 11209 }, { "epoch": 0.34, "learning_rate": 3.857984935204292e-06, "loss": 1.2886, "step": 11210 }, { "epoch": 0.34, "learning_rate": 3.857780131704023e-06, "loss": 1.2128, "step": 11211 }, { "epoch": 0.34, "learning_rate": 3.8575753152783414e-06, "loss": 1.1066, "step": 11212 }, { "epoch": 0.34, "learning_rate": 3.857370485929196e-06, "loss": 1.0425, "step": 11213 }, { "epoch": 0.34, "learning_rate": 3.857165643658538e-06, "loss": 1.1585, "step": 11214 }, { "epoch": 0.34, "learning_rate": 3.856960788468316e-06, "loss": 1.0848, "step": 11215 }, { "epoch": 0.34, "learning_rate": 3.8567559203604805e-06, "loss": 1.1354, "step": 11216 }, { "epoch": 0.34, "learning_rate": 3.856551039336984e-06, "loss": 1.0338, "step": 11217 }, { "epoch": 0.34, "learning_rate": 3.856346145399773e-06, "loss": 1.2699, "step": 11218 }, { "epoch": 0.34, "learning_rate": 3.856141238550801e-06, "loss": 1.2303, "step": 11219 }, { "epoch": 0.34, "learning_rate": 3.855936318792018e-06, "loss": 1.1844, "step": 11220 }, { "epoch": 0.34, "learning_rate": 3.855731386125373e-06, "loss": 1.0306, "step": 11221 }, { "epoch": 0.34, "learning_rate": 3.855526440552818e-06, "loss": 1.1191, "step": 11222 }, { "epoch": 0.34, "learning_rate": 3.855321482076305e-06, "loss": 1.0703, "step": 11223 }, { "epoch": 0.34, "learning_rate": 3.855116510697784e-06, "loss": 1.2028, "step": 11224 }, { "epoch": 0.34, "learning_rate": 3.8549115264192074e-06, "loss": 1.0339, "step": 11225 }, { "epoch": 0.34, "learning_rate": 3.854706529242524e-06, "loss": 1.0765, "step": 11226 }, { "epoch": 0.34, "learning_rate": 3.854501519169688e-06, "loss": 1.1219, "step": 11227 }, { "epoch": 0.34, "learning_rate": 3.854296496202649e-06, "loss": 1.0971, "step": 11228 }, { "epoch": 0.34, "learning_rate": 3.85409146034336e-06, "loss": 1.257, "step": 11229 }, { "epoch": 0.34, "learning_rate": 3.853886411593773e-06, "loss": 1.1918, "step": 11230 }, { "epoch": 0.34, "learning_rate": 3.853681349955839e-06, "loss": 1.1364, "step": 11231 }, { "epoch": 0.34, "learning_rate": 3.85347627543151e-06, "loss": 1.1276, "step": 11232 }, { "epoch": 0.34, "learning_rate": 3.8532711880227396e-06, "loss": 1.1462, "step": 11233 }, { "epoch": 0.34, "learning_rate": 3.853066087731478e-06, "loss": 1.1231, "step": 11234 }, { "epoch": 0.34, "learning_rate": 3.8528609745596805e-06, "loss": 1.188, "step": 11235 }, { "epoch": 0.34, "learning_rate": 3.8526558485092975e-06, "loss": 1.1536, "step": 11236 }, { "epoch": 0.34, "learning_rate": 3.8524507095822816e-06, "loss": 1.1187, "step": 11237 }, { "epoch": 0.34, "learning_rate": 3.852245557780588e-06, "loss": 1.1746, "step": 11238 }, { "epoch": 0.34, "learning_rate": 3.8520403931061654e-06, "loss": 1.0988, "step": 11239 }, { "epoch": 0.34, "learning_rate": 3.851835215560971e-06, "loss": 1.0845, "step": 11240 }, { "epoch": 0.34, "learning_rate": 3.8516300251469565e-06, "loss": 1.221, "step": 11241 }, { "epoch": 0.34, "learning_rate": 3.8514248218660745e-06, "loss": 1.1458, "step": 11242 }, { "epoch": 0.34, "learning_rate": 3.851219605720279e-06, "loss": 1.1812, "step": 11243 }, { "epoch": 0.34, "learning_rate": 3.851014376711524e-06, "loss": 1.1844, "step": 11244 }, { "epoch": 0.34, "learning_rate": 3.8508091348417635e-06, "loss": 1.0787, "step": 11245 }, { "epoch": 0.34, "learning_rate": 3.85060388011295e-06, "loss": 1.0972, "step": 11246 }, { "epoch": 0.34, "learning_rate": 3.8503986125270375e-06, "loss": 1.177, "step": 11247 }, { "epoch": 0.34, "learning_rate": 3.8501933320859806e-06, "loss": 1.1689, "step": 11248 }, { "epoch": 0.34, "learning_rate": 3.849988038791734e-06, "loss": 1.2109, "step": 11249 }, { "epoch": 0.34, "learning_rate": 3.849782732646252e-06, "loss": 1.0764, "step": 11250 }, { "epoch": 0.34, "learning_rate": 3.849577413651488e-06, "loss": 1.1581, "step": 11251 }, { "epoch": 0.34, "learning_rate": 3.8493720818093965e-06, "loss": 1.166, "step": 11252 }, { "epoch": 0.34, "learning_rate": 3.849166737121933e-06, "loss": 1.0887, "step": 11253 }, { "epoch": 0.34, "learning_rate": 3.848961379591052e-06, "loss": 1.2064, "step": 11254 }, { "epoch": 0.34, "learning_rate": 3.8487560092187084e-06, "loss": 1.1936, "step": 11255 }, { "epoch": 0.34, "learning_rate": 3.848550626006857e-06, "loss": 1.1373, "step": 11256 }, { "epoch": 0.34, "learning_rate": 3.848345229957453e-06, "loss": 1.1746, "step": 11257 }, { "epoch": 0.34, "learning_rate": 3.848139821072452e-06, "loss": 1.0573, "step": 11258 }, { "epoch": 0.34, "learning_rate": 3.847934399353809e-06, "loss": 1.177, "step": 11259 }, { "epoch": 0.34, "learning_rate": 3.84772896480348e-06, "loss": 1.1175, "step": 11260 }, { "epoch": 0.34, "learning_rate": 3.8475235174234196e-06, "loss": 1.1229, "step": 11261 }, { "epoch": 0.34, "learning_rate": 3.847318057215585e-06, "loss": 1.1185, "step": 11262 }, { "epoch": 0.34, "learning_rate": 3.8471125841819316e-06, "loss": 1.2097, "step": 11263 }, { "epoch": 0.34, "learning_rate": 3.846907098324415e-06, "loss": 1.044, "step": 11264 }, { "epoch": 0.34, "learning_rate": 3.8467015996449905e-06, "loss": 1.1022, "step": 11265 }, { "epoch": 0.34, "learning_rate": 3.846496088145617e-06, "loss": 1.1812, "step": 11266 }, { "epoch": 0.34, "learning_rate": 3.846290563828249e-06, "loss": 1.1366, "step": 11267 }, { "epoch": 0.34, "learning_rate": 3.846085026694842e-06, "loss": 1.0645, "step": 11268 }, { "epoch": 0.34, "learning_rate": 3.845879476747355e-06, "loss": 1.0046, "step": 11269 }, { "epoch": 0.34, "learning_rate": 3.845673913987743e-06, "loss": 1.1031, "step": 11270 }, { "epoch": 0.34, "learning_rate": 3.845468338417963e-06, "loss": 1.175, "step": 11271 }, { "epoch": 0.34, "learning_rate": 3.845262750039973e-06, "loss": 1.0826, "step": 11272 }, { "epoch": 0.34, "learning_rate": 3.84505714885573e-06, "loss": 1.1688, "step": 11273 }, { "epoch": 0.34, "learning_rate": 3.84485153486719e-06, "loss": 1.1766, "step": 11274 }, { "epoch": 0.34, "learning_rate": 3.844645908076311e-06, "loss": 1.2717, "step": 11275 }, { "epoch": 0.34, "learning_rate": 3.844440268485052e-06, "loss": 1.0822, "step": 11276 }, { "epoch": 0.34, "learning_rate": 3.844234616095367e-06, "loss": 1.118, "step": 11277 }, { "epoch": 0.34, "learning_rate": 3.844028950909218e-06, "loss": 1.2838, "step": 11278 }, { "epoch": 0.34, "learning_rate": 3.84382327292856e-06, "loss": 1.098, "step": 11279 }, { "epoch": 0.34, "learning_rate": 3.8436175821553505e-06, "loss": 1.1099, "step": 11280 }, { "epoch": 0.34, "learning_rate": 3.84341187859155e-06, "loss": 1.311, "step": 11281 }, { "epoch": 0.34, "learning_rate": 3.843206162239114e-06, "loss": 1.1389, "step": 11282 }, { "epoch": 0.34, "learning_rate": 3.843000433100004e-06, "loss": 1.1245, "step": 11283 }, { "epoch": 0.34, "learning_rate": 3.842794691176175e-06, "loss": 1.0717, "step": 11284 }, { "epoch": 0.34, "learning_rate": 3.842588936469588e-06, "loss": 1.1424, "step": 11285 }, { "epoch": 0.34, "learning_rate": 3.842383168982201e-06, "loss": 1.1847, "step": 11286 }, { "epoch": 0.34, "learning_rate": 3.842177388715973e-06, "loss": 1.1407, "step": 11287 }, { "epoch": 0.34, "learning_rate": 3.841971595672863e-06, "loss": 1.128, "step": 11288 }, { "epoch": 0.34, "learning_rate": 3.841765789854829e-06, "loss": 1.1387, "step": 11289 }, { "epoch": 0.34, "learning_rate": 3.841559971263831e-06, "loss": 1.041, "step": 11290 }, { "epoch": 0.34, "learning_rate": 3.841354139901828e-06, "loss": 1.1782, "step": 11291 }, { "epoch": 0.34, "learning_rate": 3.84114829577078e-06, "loss": 1.2205, "step": 11292 }, { "epoch": 0.34, "learning_rate": 3.8409424388726455e-06, "loss": 1.1951, "step": 11293 }, { "epoch": 0.34, "learning_rate": 3.840736569209386e-06, "loss": 1.1729, "step": 11294 }, { "epoch": 0.34, "learning_rate": 3.84053068678296e-06, "loss": 1.1365, "step": 11295 }, { "epoch": 0.34, "learning_rate": 3.840324791595325e-06, "loss": 1.1543, "step": 11296 }, { "epoch": 0.34, "learning_rate": 3.840118883648447e-06, "loss": 1.1616, "step": 11297 }, { "epoch": 0.34, "learning_rate": 3.8399129629442805e-06, "loss": 1.1273, "step": 11298 }, { "epoch": 0.34, "learning_rate": 3.839707029484788e-06, "loss": 1.2728, "step": 11299 }, { "epoch": 0.34, "learning_rate": 3.839501083271931e-06, "loss": 1.2471, "step": 11300 }, { "epoch": 0.34, "learning_rate": 3.839295124307668e-06, "loss": 1.189, "step": 11301 }, { "epoch": 0.34, "learning_rate": 3.83908915259396e-06, "loss": 1.1764, "step": 11302 }, { "epoch": 0.34, "learning_rate": 3.838883168132769e-06, "loss": 1.1628, "step": 11303 }, { "epoch": 0.34, "learning_rate": 3.838677170926055e-06, "loss": 1.1233, "step": 11304 }, { "epoch": 0.34, "learning_rate": 3.838471160975779e-06, "loss": 1.2184, "step": 11305 }, { "epoch": 0.34, "learning_rate": 3.838265138283902e-06, "loss": 1.0927, "step": 11306 }, { "epoch": 0.34, "learning_rate": 3.838059102852385e-06, "loss": 1.0902, "step": 11307 }, { "epoch": 0.34, "learning_rate": 3.837853054683191e-06, "loss": 1.1725, "step": 11308 }, { "epoch": 0.34, "learning_rate": 3.837646993778279e-06, "loss": 1.0939, "step": 11309 }, { "epoch": 0.34, "learning_rate": 3.837440920139612e-06, "loss": 1.0936, "step": 11310 }, { "epoch": 0.34, "learning_rate": 3.837234833769152e-06, "loss": 1.1382, "step": 11311 }, { "epoch": 0.34, "learning_rate": 3.83702873466886e-06, "loss": 1.1135, "step": 11312 }, { "epoch": 0.34, "learning_rate": 3.836822622840698e-06, "loss": 1.2263, "step": 11313 }, { "epoch": 0.34, "learning_rate": 3.83661649828663e-06, "loss": 1.1556, "step": 11314 }, { "epoch": 0.34, "learning_rate": 3.836410361008616e-06, "loss": 1.1937, "step": 11315 }, { "epoch": 0.34, "learning_rate": 3.836204211008619e-06, "loss": 1.1068, "step": 11316 }, { "epoch": 0.34, "learning_rate": 3.835998048288601e-06, "loss": 1.1071, "step": 11317 }, { "epoch": 0.34, "learning_rate": 3.835791872850525e-06, "loss": 1.2205, "step": 11318 }, { "epoch": 0.34, "learning_rate": 3.835585684696355e-06, "loss": 1.2443, "step": 11319 }, { "epoch": 0.34, "learning_rate": 3.835379483828051e-06, "loss": 1.2811, "step": 11320 }, { "epoch": 0.34, "learning_rate": 3.835173270247578e-06, "loss": 1.1091, "step": 11321 }, { "epoch": 0.34, "learning_rate": 3.834967043956898e-06, "loss": 1.2241, "step": 11322 }, { "epoch": 0.34, "learning_rate": 3.8347608049579754e-06, "loss": 1.1158, "step": 11323 }, { "epoch": 0.34, "learning_rate": 3.834554553252773e-06, "loss": 1.1382, "step": 11324 }, { "epoch": 0.34, "learning_rate": 3.834348288843252e-06, "loss": 1.1914, "step": 11325 }, { "epoch": 0.34, "learning_rate": 3.834142011731381e-06, "loss": 1.1285, "step": 11326 }, { "epoch": 0.34, "learning_rate": 3.833935721919119e-06, "loss": 1.1374, "step": 11327 }, { "epoch": 0.34, "learning_rate": 3.83372941940843e-06, "loss": 1.1534, "step": 11328 }, { "epoch": 0.34, "learning_rate": 3.833523104201282e-06, "loss": 1.1641, "step": 11329 }, { "epoch": 0.34, "learning_rate": 3.833316776299635e-06, "loss": 1.2583, "step": 11330 }, { "epoch": 0.34, "learning_rate": 3.833110435705454e-06, "loss": 1.0554, "step": 11331 }, { "epoch": 0.34, "learning_rate": 3.832904082420704e-06, "loss": 1.1052, "step": 11332 }, { "epoch": 0.34, "learning_rate": 3.83269771644735e-06, "loss": 1.0876, "step": 11333 }, { "epoch": 0.34, "learning_rate": 3.832491337787355e-06, "loss": 1.1328, "step": 11334 }, { "epoch": 0.34, "learning_rate": 3.832284946442684e-06, "loss": 1.2404, "step": 11335 }, { "epoch": 0.34, "learning_rate": 3.8320785424153015e-06, "loss": 1.2032, "step": 11336 }, { "epoch": 0.34, "learning_rate": 3.8318721257071735e-06, "loss": 1.2103, "step": 11337 }, { "epoch": 0.34, "learning_rate": 3.831665696320265e-06, "loss": 1.0918, "step": 11338 }, { "epoch": 0.34, "learning_rate": 3.831459254256539e-06, "loss": 1.2373, "step": 11339 }, { "epoch": 0.34, "learning_rate": 3.831252799517963e-06, "loss": 1.1406, "step": 11340 }, { "epoch": 0.34, "learning_rate": 3.8310463321065e-06, "loss": 1.1432, "step": 11341 }, { "epoch": 0.34, "learning_rate": 3.830839852024118e-06, "loss": 1.0778, "step": 11342 }, { "epoch": 0.34, "learning_rate": 3.8306333592727825e-06, "loss": 1.1412, "step": 11343 }, { "epoch": 0.34, "learning_rate": 3.830426853854458e-06, "loss": 1.1668, "step": 11344 }, { "epoch": 0.34, "learning_rate": 3.83022033577111e-06, "loss": 1.0898, "step": 11345 }, { "epoch": 0.34, "learning_rate": 3.830013805024705e-06, "loss": 1.1873, "step": 11346 }, { "epoch": 0.34, "learning_rate": 3.829807261617209e-06, "loss": 1.0211, "step": 11347 }, { "epoch": 0.34, "learning_rate": 3.829600705550589e-06, "loss": 1.1703, "step": 11348 }, { "epoch": 0.34, "learning_rate": 3.829394136826811e-06, "loss": 1.2041, "step": 11349 }, { "epoch": 0.34, "learning_rate": 3.829187555447839e-06, "loss": 1.2205, "step": 11350 }, { "epoch": 0.34, "learning_rate": 3.828980961415643e-06, "loss": 1.2059, "step": 11351 }, { "epoch": 0.34, "learning_rate": 3.8287743547321884e-06, "loss": 1.1609, "step": 11352 }, { "epoch": 0.34, "learning_rate": 3.8285677353994426e-06, "loss": 1.1196, "step": 11353 }, { "epoch": 0.34, "learning_rate": 3.82836110341937e-06, "loss": 1.254, "step": 11354 }, { "epoch": 0.34, "learning_rate": 3.8281544587939416e-06, "loss": 1.1479, "step": 11355 }, { "epoch": 0.34, "learning_rate": 3.82794780152512e-06, "loss": 1.1364, "step": 11356 }, { "epoch": 0.34, "learning_rate": 3.827741131614877e-06, "loss": 1.166, "step": 11357 }, { "epoch": 0.34, "learning_rate": 3.827534449065177e-06, "loss": 1.1552, "step": 11358 }, { "epoch": 0.34, "learning_rate": 3.8273277538779886e-06, "loss": 0.9754, "step": 11359 }, { "epoch": 0.34, "learning_rate": 3.827121046055279e-06, "loss": 1.0603, "step": 11360 }, { "epoch": 0.34, "learning_rate": 3.826914325599017e-06, "loss": 1.1854, "step": 11361 }, { "epoch": 0.34, "learning_rate": 3.826707592511169e-06, "loss": 1.1102, "step": 11362 }, { "epoch": 0.34, "learning_rate": 3.826500846793703e-06, "loss": 1.204, "step": 11363 }, { "epoch": 0.34, "learning_rate": 3.8262940884485885e-06, "loss": 1.1079, "step": 11364 }, { "epoch": 0.34, "learning_rate": 3.826087317477794e-06, "loss": 1.2416, "step": 11365 }, { "epoch": 0.34, "learning_rate": 3.825880533883285e-06, "loss": 1.1062, "step": 11366 }, { "epoch": 0.34, "learning_rate": 3.825673737667033e-06, "loss": 1.0864, "step": 11367 }, { "epoch": 0.34, "learning_rate": 3.825466928831006e-06, "loss": 1.1881, "step": 11368 }, { "epoch": 0.34, "learning_rate": 3.825260107377171e-06, "loss": 1.1849, "step": 11369 }, { "epoch": 0.34, "learning_rate": 3.825053273307499e-06, "loss": 1.1663, "step": 11370 }, { "epoch": 0.34, "learning_rate": 3.824846426623957e-06, "loss": 1.1207, "step": 11371 }, { "epoch": 0.34, "learning_rate": 3.824639567328516e-06, "loss": 1.1537, "step": 11372 }, { "epoch": 0.34, "learning_rate": 3.824432695423144e-06, "loss": 1.048, "step": 11373 }, { "epoch": 0.34, "learning_rate": 3.824225810909811e-06, "loss": 1.1934, "step": 11374 }, { "epoch": 0.34, "learning_rate": 3.824018913790485e-06, "loss": 1.0866, "step": 11375 }, { "epoch": 0.34, "learning_rate": 3.823812004067136e-06, "loss": 1.0991, "step": 11376 }, { "epoch": 0.34, "learning_rate": 3.823605081741737e-06, "loss": 1.1998, "step": 11377 }, { "epoch": 0.34, "learning_rate": 3.823398146816253e-06, "loss": 1.1817, "step": 11378 }, { "epoch": 0.34, "learning_rate": 3.8231911992926575e-06, "loss": 1.2981, "step": 11379 }, { "epoch": 0.34, "learning_rate": 3.822984239172917e-06, "loss": 1.1509, "step": 11380 }, { "epoch": 0.34, "learning_rate": 3.822777266459006e-06, "loss": 1.2178, "step": 11381 }, { "epoch": 0.34, "learning_rate": 3.822570281152891e-06, "loss": 1.1038, "step": 11382 }, { "epoch": 0.34, "learning_rate": 3.822363283256544e-06, "loss": 1.0583, "step": 11383 }, { "epoch": 0.34, "learning_rate": 3.822156272771935e-06, "loss": 1.1221, "step": 11384 }, { "epoch": 0.34, "learning_rate": 3.821949249701037e-06, "loss": 1.1196, "step": 11385 }, { "epoch": 0.34, "learning_rate": 3.821742214045817e-06, "loss": 1.1716, "step": 11386 }, { "epoch": 0.34, "learning_rate": 3.821535165808249e-06, "loss": 1.1551, "step": 11387 }, { "epoch": 0.34, "learning_rate": 3.821328104990301e-06, "loss": 1.1602, "step": 11388 }, { "epoch": 0.34, "learning_rate": 3.821121031593947e-06, "loss": 1.0604, "step": 11389 }, { "epoch": 0.34, "learning_rate": 3.8209139456211566e-06, "loss": 1.0154, "step": 11390 }, { "epoch": 0.34, "learning_rate": 3.8207068470739016e-06, "loss": 1.1691, "step": 11391 }, { "epoch": 0.34, "learning_rate": 3.820499735954154e-06, "loss": 1.1146, "step": 11392 }, { "epoch": 0.34, "learning_rate": 3.820292612263885e-06, "loss": 1.246, "step": 11393 }, { "epoch": 0.34, "learning_rate": 3.820085476005066e-06, "loss": 1.0847, "step": 11394 }, { "epoch": 0.34, "learning_rate": 3.819878327179668e-06, "loss": 1.2289, "step": 11395 }, { "epoch": 0.34, "learning_rate": 3.8196711657896655e-06, "loss": 1.0496, "step": 11396 }, { "epoch": 0.34, "learning_rate": 3.819463991837028e-06, "loss": 1.226, "step": 11397 }, { "epoch": 0.34, "learning_rate": 3.819256805323729e-06, "loss": 1.2891, "step": 11398 }, { "epoch": 0.34, "learning_rate": 3.8190496062517415e-06, "loss": 1.1743, "step": 11399 }, { "epoch": 0.34, "learning_rate": 3.818842394623036e-06, "loss": 1.1342, "step": 11400 }, { "epoch": 0.34, "learning_rate": 3.818635170439586e-06, "loss": 1.2535, "step": 11401 }, { "epoch": 0.34, "learning_rate": 3.8184279337033645e-06, "loss": 1.0726, "step": 11402 }, { "epoch": 0.34, "learning_rate": 3.818220684416345e-06, "loss": 1.0346, "step": 11403 }, { "epoch": 0.34, "learning_rate": 3.818013422580499e-06, "loss": 1.1307, "step": 11404 }, { "epoch": 0.34, "learning_rate": 3.817806148197799e-06, "loss": 1.2748, "step": 11405 }, { "epoch": 0.34, "learning_rate": 3.81759886127022e-06, "loss": 1.1802, "step": 11406 }, { "epoch": 0.34, "learning_rate": 3.817391561799734e-06, "loss": 1.0868, "step": 11407 }, { "epoch": 0.34, "learning_rate": 3.8171842497883145e-06, "loss": 1.2188, "step": 11408 }, { "epoch": 0.34, "learning_rate": 3.816976925237936e-06, "loss": 1.062, "step": 11409 }, { "epoch": 0.34, "learning_rate": 3.816769588150572e-06, "loss": 1.2269, "step": 11410 }, { "epoch": 0.34, "learning_rate": 3.816562238528195e-06, "loss": 1.1703, "step": 11411 }, { "epoch": 0.34, "learning_rate": 3.816354876372779e-06, "loss": 1.1719, "step": 11412 }, { "epoch": 0.34, "learning_rate": 3.8161475016863e-06, "loss": 1.1825, "step": 11413 }, { "epoch": 0.34, "learning_rate": 3.815940114470729e-06, "loss": 1.0801, "step": 11414 }, { "epoch": 0.34, "learning_rate": 3.815732714728042e-06, "loss": 1.0789, "step": 11415 }, { "epoch": 0.34, "learning_rate": 3.815525302460215e-06, "loss": 1.0328, "step": 11416 }, { "epoch": 0.34, "learning_rate": 3.815317877669219e-06, "loss": 1.2045, "step": 11417 }, { "epoch": 0.34, "learning_rate": 3.815110440357032e-06, "loss": 1.103, "step": 11418 }, { "epoch": 0.34, "learning_rate": 3.814902990525625e-06, "loss": 1.0906, "step": 11419 }, { "epoch": 0.34, "learning_rate": 3.814695528176976e-06, "loss": 1.1469, "step": 11420 }, { "epoch": 0.34, "learning_rate": 3.8144880533130585e-06, "loss": 1.1471, "step": 11421 }, { "epoch": 0.34, "learning_rate": 3.814280565935847e-06, "loss": 1.0906, "step": 11422 }, { "epoch": 0.34, "learning_rate": 3.8140730660473186e-06, "loss": 1.0963, "step": 11423 }, { "epoch": 0.34, "learning_rate": 3.813865553649447e-06, "loss": 1.2418, "step": 11424 }, { "epoch": 0.34, "learning_rate": 3.813658028744208e-06, "loss": 1.071, "step": 11425 }, { "epoch": 0.34, "learning_rate": 3.8134504913335777e-06, "loss": 1.2438, "step": 11426 }, { "epoch": 0.34, "learning_rate": 3.8132429414195316e-06, "loss": 1.1471, "step": 11427 }, { "epoch": 0.34, "learning_rate": 3.813035379004044e-06, "loss": 1.18, "step": 11428 }, { "epoch": 0.34, "learning_rate": 3.8128278040890933e-06, "loss": 1.0852, "step": 11429 }, { "epoch": 0.34, "learning_rate": 3.8126202166766533e-06, "loss": 1.246, "step": 11430 }, { "epoch": 0.34, "learning_rate": 3.8124126167687016e-06, "loss": 1.0334, "step": 11431 }, { "epoch": 0.34, "learning_rate": 3.8122050043672134e-06, "loss": 1.1552, "step": 11432 }, { "epoch": 0.34, "learning_rate": 3.811997379474166e-06, "loss": 1.134, "step": 11433 }, { "epoch": 0.34, "learning_rate": 3.8117897420915345e-06, "loss": 1.0954, "step": 11434 }, { "epoch": 0.34, "learning_rate": 3.811582092221297e-06, "loss": 1.1829, "step": 11435 }, { "epoch": 0.34, "learning_rate": 3.81137442986543e-06, "loss": 1.1862, "step": 11436 }, { "epoch": 0.34, "learning_rate": 3.811166755025909e-06, "loss": 1.2681, "step": 11437 }, { "epoch": 0.34, "learning_rate": 3.8109590677047126e-06, "loss": 0.9451, "step": 11438 }, { "epoch": 0.34, "learning_rate": 3.810751367903818e-06, "loss": 1.202, "step": 11439 }, { "epoch": 0.34, "learning_rate": 3.8105436556252008e-06, "loss": 1.1324, "step": 11440 }, { "epoch": 0.34, "learning_rate": 3.8103359308708395e-06, "loss": 1.0298, "step": 11441 }, { "epoch": 0.34, "learning_rate": 3.810128193642711e-06, "loss": 1.05, "step": 11442 }, { "epoch": 0.34, "learning_rate": 3.809920443942793e-06, "loss": 1.1652, "step": 11443 }, { "epoch": 0.34, "learning_rate": 3.8097126817730635e-06, "loss": 1.113, "step": 11444 }, { "epoch": 0.34, "learning_rate": 3.8095049071354997e-06, "loss": 1.3311, "step": 11445 }, { "epoch": 0.34, "learning_rate": 3.8092971200320803e-06, "loss": 1.1134, "step": 11446 }, { "epoch": 0.34, "learning_rate": 3.809089320464783e-06, "loss": 1.0762, "step": 11447 }, { "epoch": 0.34, "learning_rate": 3.8088815084355845e-06, "loss": 1.1506, "step": 11448 }, { "epoch": 0.34, "learning_rate": 3.8086736839464657e-06, "loss": 1.0865, "step": 11449 }, { "epoch": 0.34, "learning_rate": 3.808465846999404e-06, "loss": 1.1038, "step": 11450 }, { "epoch": 0.34, "learning_rate": 3.8082579975963764e-06, "loss": 1.1733, "step": 11451 }, { "epoch": 0.34, "learning_rate": 3.808050135739364e-06, "loss": 1.2559, "step": 11452 }, { "epoch": 0.35, "learning_rate": 3.8078422614303432e-06, "loss": 1.1047, "step": 11453 }, { "epoch": 0.35, "learning_rate": 3.8076343746712954e-06, "loss": 1.1373, "step": 11454 }, { "epoch": 0.35, "learning_rate": 3.8074264754641967e-06, "loss": 1.1487, "step": 11455 }, { "epoch": 0.35, "learning_rate": 3.8072185638110284e-06, "loss": 1.1046, "step": 11456 }, { "epoch": 0.35, "learning_rate": 3.8070106397137687e-06, "loss": 1.1274, "step": 11457 }, { "epoch": 0.35, "learning_rate": 3.806802703174397e-06, "loss": 1.0967, "step": 11458 }, { "epoch": 0.35, "learning_rate": 3.8065947541948933e-06, "loss": 1.1275, "step": 11459 }, { "epoch": 0.35, "learning_rate": 3.806386792777236e-06, "loss": 1.0096, "step": 11460 }, { "epoch": 0.35, "learning_rate": 3.8061788189234066e-06, "loss": 1.0679, "step": 11461 }, { "epoch": 0.35, "learning_rate": 3.8059708326353833e-06, "loss": 1.1205, "step": 11462 }, { "epoch": 0.35, "learning_rate": 3.805762833915147e-06, "loss": 1.2109, "step": 11463 }, { "epoch": 0.35, "learning_rate": 3.805554822764677e-06, "loss": 1.1859, "step": 11464 }, { "epoch": 0.35, "learning_rate": 3.8053467991859545e-06, "loss": 1.0886, "step": 11465 }, { "epoch": 0.35, "learning_rate": 3.8051387631809587e-06, "loss": 1.0616, "step": 11466 }, { "epoch": 0.35, "learning_rate": 3.8049307147516706e-06, "loss": 1.1133, "step": 11467 }, { "epoch": 0.35, "learning_rate": 3.8047226539000704e-06, "loss": 1.2358, "step": 11468 }, { "epoch": 0.35, "learning_rate": 3.804514580628139e-06, "loss": 1.3397, "step": 11469 }, { "epoch": 0.35, "learning_rate": 3.804306494937857e-06, "loss": 1.0816, "step": 11470 }, { "epoch": 0.35, "learning_rate": 3.8040983968312055e-06, "loss": 1.1488, "step": 11471 }, { "epoch": 0.35, "learning_rate": 3.8038902863101655e-06, "loss": 1.0485, "step": 11472 }, { "epoch": 0.35, "learning_rate": 3.8036821633767174e-06, "loss": 1.1935, "step": 11473 }, { "epoch": 0.35, "learning_rate": 3.803474028032844e-06, "loss": 1.15, "step": 11474 }, { "epoch": 0.35, "learning_rate": 3.8032658802805246e-06, "loss": 1.1705, "step": 11475 }, { "epoch": 0.35, "learning_rate": 3.8030577201217424e-06, "loss": 1.1174, "step": 11476 }, { "epoch": 0.35, "learning_rate": 3.802849547558477e-06, "loss": 1.0398, "step": 11477 }, { "epoch": 0.35, "learning_rate": 3.8026413625927127e-06, "loss": 1.1444, "step": 11478 }, { "epoch": 0.35, "learning_rate": 3.8024331652264294e-06, "loss": 1.1948, "step": 11479 }, { "epoch": 0.35, "learning_rate": 3.8022249554616103e-06, "loss": 1.1248, "step": 11480 }, { "epoch": 0.35, "learning_rate": 3.802016733300236e-06, "loss": 1.2236, "step": 11481 }, { "epoch": 0.35, "learning_rate": 3.80180849874429e-06, "loss": 1.1448, "step": 11482 }, { "epoch": 0.35, "learning_rate": 3.801600251795754e-06, "loss": 1.1776, "step": 11483 }, { "epoch": 0.35, "learning_rate": 3.80139199245661e-06, "loss": 1.1823, "step": 11484 }, { "epoch": 0.35, "learning_rate": 3.8011837207288417e-06, "loss": 1.1415, "step": 11485 }, { "epoch": 0.35, "learning_rate": 3.800975436614431e-06, "loss": 1.134, "step": 11486 }, { "epoch": 0.35, "learning_rate": 3.80076714011536e-06, "loss": 1.1943, "step": 11487 }, { "epoch": 0.35, "learning_rate": 3.800558831233613e-06, "loss": 1.0865, "step": 11488 }, { "epoch": 0.35, "learning_rate": 3.800350509971172e-06, "loss": 1.0847, "step": 11489 }, { "epoch": 0.35, "learning_rate": 3.80014217633002e-06, "loss": 1.0273, "step": 11490 }, { "epoch": 0.35, "learning_rate": 3.7999338303121413e-06, "loss": 1.2169, "step": 11491 }, { "epoch": 0.35, "learning_rate": 3.7997254719195186e-06, "loss": 1.0132, "step": 11492 }, { "epoch": 0.35, "learning_rate": 3.7995171011541353e-06, "loss": 1.1223, "step": 11493 }, { "epoch": 0.35, "learning_rate": 3.7993087180179743e-06, "loss": 1.1423, "step": 11494 }, { "epoch": 0.35, "learning_rate": 3.7991003225130206e-06, "loss": 1.0707, "step": 11495 }, { "epoch": 0.35, "learning_rate": 3.7988919146412584e-06, "loss": 1.1282, "step": 11496 }, { "epoch": 0.35, "learning_rate": 3.798683494404669e-06, "loss": 1.0237, "step": 11497 }, { "epoch": 0.35, "learning_rate": 3.79847506180524e-06, "loss": 1.1532, "step": 11498 }, { "epoch": 0.35, "learning_rate": 3.7982666168449528e-06, "loss": 1.1275, "step": 11499 }, { "epoch": 0.35, "learning_rate": 3.798058159525793e-06, "loss": 1.0451, "step": 11500 }, { "epoch": 0.35, "learning_rate": 3.7978496898497443e-06, "loss": 1.1316, "step": 11501 }, { "epoch": 0.35, "learning_rate": 3.797641207818792e-06, "loss": 1.0974, "step": 11502 }, { "epoch": 0.35, "learning_rate": 3.79743271343492e-06, "loss": 1.1494, "step": 11503 }, { "epoch": 0.35, "learning_rate": 3.797224206700113e-06, "loss": 1.1258, "step": 11504 }, { "epoch": 0.35, "learning_rate": 3.797015687616357e-06, "loss": 1.1487, "step": 11505 }, { "epoch": 0.35, "learning_rate": 3.796807156185637e-06, "loss": 1.1003, "step": 11506 }, { "epoch": 0.35, "learning_rate": 3.7965986124099362e-06, "loss": 1.043, "step": 11507 }, { "epoch": 0.35, "learning_rate": 3.7963900562912414e-06, "loss": 1.1001, "step": 11508 }, { "epoch": 0.35, "learning_rate": 3.7961814878315382e-06, "loss": 1.0365, "step": 11509 }, { "epoch": 0.35, "learning_rate": 3.795972907032811e-06, "loss": 1.1608, "step": 11510 }, { "epoch": 0.35, "learning_rate": 3.7957643138970458e-06, "loss": 1.1598, "step": 11511 }, { "epoch": 0.35, "learning_rate": 3.7955557084262286e-06, "loss": 1.1849, "step": 11512 }, { "epoch": 0.35, "learning_rate": 3.7953470906223454e-06, "loss": 1.1354, "step": 11513 }, { "epoch": 0.35, "learning_rate": 3.7951384604873807e-06, "loss": 1.1715, "step": 11514 }, { "epoch": 0.35, "learning_rate": 3.794929818023323e-06, "loss": 1.1185, "step": 11515 }, { "epoch": 0.35, "learning_rate": 3.7947211632321557e-06, "loss": 1.233, "step": 11516 }, { "epoch": 0.35, "learning_rate": 3.7945124961158676e-06, "loss": 1.2098, "step": 11517 }, { "epoch": 0.35, "learning_rate": 3.7943038166764427e-06, "loss": 1.0251, "step": 11518 }, { "epoch": 0.35, "learning_rate": 3.7940951249158704e-06, "loss": 1.197, "step": 11519 }, { "epoch": 0.35, "learning_rate": 3.7938864208361347e-06, "loss": 1.1926, "step": 11520 }, { "epoch": 0.35, "learning_rate": 3.7936777044392236e-06, "loss": 1.0954, "step": 11521 }, { "epoch": 0.35, "learning_rate": 3.7934689757271236e-06, "loss": 1.0927, "step": 11522 }, { "epoch": 0.35, "learning_rate": 3.793260234701822e-06, "loss": 1.2058, "step": 11523 }, { "epoch": 0.35, "learning_rate": 3.793051481365307e-06, "loss": 1.0874, "step": 11524 }, { "epoch": 0.35, "learning_rate": 3.7928427157195634e-06, "loss": 1.227, "step": 11525 }, { "epoch": 0.35, "learning_rate": 3.7926339377665806e-06, "loss": 1.1355, "step": 11526 }, { "epoch": 0.35, "learning_rate": 3.7924251475083444e-06, "loss": 1.1678, "step": 11527 }, { "epoch": 0.35, "learning_rate": 3.7922163449468442e-06, "loss": 1.1815, "step": 11528 }, { "epoch": 0.35, "learning_rate": 3.7920075300840658e-06, "loss": 1.1586, "step": 11529 }, { "epoch": 0.35, "learning_rate": 3.7917987029219983e-06, "loss": 1.2297, "step": 11530 }, { "epoch": 0.35, "learning_rate": 3.791589863462629e-06, "loss": 1.1122, "step": 11531 }, { "epoch": 0.35, "learning_rate": 3.791381011707947e-06, "loss": 1.1852, "step": 11532 }, { "epoch": 0.35, "learning_rate": 3.7911721476599396e-06, "loss": 1.1077, "step": 11533 }, { "epoch": 0.35, "learning_rate": 3.7909632713205944e-06, "loss": 1.1136, "step": 11534 }, { "epoch": 0.35, "learning_rate": 3.7907543826919015e-06, "loss": 1.0233, "step": 11535 }, { "epoch": 0.35, "learning_rate": 3.790545481775848e-06, "loss": 1.2828, "step": 11536 }, { "epoch": 0.35, "learning_rate": 3.790336568574423e-06, "loss": 1.1852, "step": 11537 }, { "epoch": 0.35, "learning_rate": 3.7901276430896156e-06, "loss": 1.0674, "step": 11538 }, { "epoch": 0.35, "learning_rate": 3.7899187053234144e-06, "loss": 1.0966, "step": 11539 }, { "epoch": 0.35, "learning_rate": 3.7897097552778084e-06, "loss": 1.1422, "step": 11540 }, { "epoch": 0.35, "learning_rate": 3.7895007929547868e-06, "loss": 1.1657, "step": 11541 }, { "epoch": 0.35, "learning_rate": 3.7892918183563388e-06, "loss": 1.0937, "step": 11542 }, { "epoch": 0.35, "learning_rate": 3.789082831484453e-06, "loss": 1.0333, "step": 11543 }, { "epoch": 0.35, "learning_rate": 3.78887383234112e-06, "loss": 1.1923, "step": 11544 }, { "epoch": 0.35, "learning_rate": 3.7886648209283283e-06, "loss": 1.127, "step": 11545 }, { "epoch": 0.35, "learning_rate": 3.7884557972480683e-06, "loss": 0.9929, "step": 11546 }, { "epoch": 0.35, "learning_rate": 3.78824676130233e-06, "loss": 1.0187, "step": 11547 }, { "epoch": 0.35, "learning_rate": 3.7880377130931028e-06, "loss": 1.2426, "step": 11548 }, { "epoch": 0.35, "learning_rate": 3.7878286526223767e-06, "loss": 1.2594, "step": 11549 }, { "epoch": 0.35, "learning_rate": 3.787619579892142e-06, "loss": 1.2211, "step": 11550 }, { "epoch": 0.35, "learning_rate": 3.78741049490439e-06, "loss": 1.1074, "step": 11551 }, { "epoch": 0.35, "learning_rate": 3.7872013976611094e-06, "loss": 1.0857, "step": 11552 }, { "epoch": 0.35, "learning_rate": 3.7869922881642917e-06, "loss": 1.103, "step": 11553 }, { "epoch": 0.35, "learning_rate": 3.786783166415927e-06, "loss": 1.1523, "step": 11554 }, { "epoch": 0.35, "learning_rate": 3.7865740324180062e-06, "loss": 1.1348, "step": 11555 }, { "epoch": 0.35, "learning_rate": 3.786364886172521e-06, "loss": 1.2645, "step": 11556 }, { "epoch": 0.35, "learning_rate": 3.7861557276814607e-06, "loss": 1.2441, "step": 11557 }, { "epoch": 0.35, "learning_rate": 3.785946556946817e-06, "loss": 1.1086, "step": 11558 }, { "epoch": 0.35, "learning_rate": 3.785737373970582e-06, "loss": 1.0829, "step": 11559 }, { "epoch": 0.35, "learning_rate": 3.785528178754747e-06, "loss": 1.1699, "step": 11560 }, { "epoch": 0.35, "learning_rate": 3.7853189713013018e-06, "loss": 1.1588, "step": 11561 }, { "epoch": 0.35, "learning_rate": 3.785109751612239e-06, "loss": 1.1716, "step": 11562 }, { "epoch": 0.35, "learning_rate": 3.7849005196895516e-06, "loss": 1.1131, "step": 11563 }, { "epoch": 0.35, "learning_rate": 3.7846912755352293e-06, "loss": 1.1068, "step": 11564 }, { "epoch": 0.35, "learning_rate": 3.784482019151265e-06, "loss": 1.032, "step": 11565 }, { "epoch": 0.35, "learning_rate": 3.7842727505396506e-06, "loss": 1.1832, "step": 11566 }, { "epoch": 0.35, "learning_rate": 3.7840634697023778e-06, "loss": 1.1459, "step": 11567 }, { "epoch": 0.35, "learning_rate": 3.7838541766414387e-06, "loss": 1.1866, "step": 11568 }, { "epoch": 0.35, "learning_rate": 3.7836448713588268e-06, "loss": 1.0855, "step": 11569 }, { "epoch": 0.35, "learning_rate": 3.7834355538565343e-06, "loss": 1.1551, "step": 11570 }, { "epoch": 0.35, "learning_rate": 3.7832262241365526e-06, "loss": 1.1229, "step": 11571 }, { "epoch": 0.35, "learning_rate": 3.7830168822008756e-06, "loss": 1.1301, "step": 11572 }, { "epoch": 0.35, "learning_rate": 3.7828075280514964e-06, "loss": 1.173, "step": 11573 }, { "epoch": 0.35, "learning_rate": 3.782598161690406e-06, "loss": 1.3577, "step": 11574 }, { "epoch": 0.35, "learning_rate": 3.7823887831196e-06, "loss": 1.0618, "step": 11575 }, { "epoch": 0.35, "learning_rate": 3.78217939234107e-06, "loss": 1.0595, "step": 11576 }, { "epoch": 0.35, "learning_rate": 3.7819699893568095e-06, "loss": 1.1329, "step": 11577 }, { "epoch": 0.35, "learning_rate": 3.7817605741688135e-06, "loss": 1.1906, "step": 11578 }, { "epoch": 0.35, "learning_rate": 3.781551146779072e-06, "loss": 1.1638, "step": 11579 }, { "epoch": 0.35, "learning_rate": 3.7813417071895824e-06, "loss": 1.2184, "step": 11580 }, { "epoch": 0.35, "learning_rate": 3.7811322554023367e-06, "loss": 1.2156, "step": 11581 }, { "epoch": 0.35, "learning_rate": 3.780922791419328e-06, "loss": 1.119, "step": 11582 }, { "epoch": 0.35, "learning_rate": 3.7807133152425523e-06, "loss": 1.1309, "step": 11583 }, { "epoch": 0.35, "learning_rate": 3.7805038268740022e-06, "loss": 1.1072, "step": 11584 }, { "epoch": 0.35, "learning_rate": 3.7802943263156722e-06, "loss": 1.248, "step": 11585 }, { "epoch": 0.35, "learning_rate": 3.7800848135695567e-06, "loss": 1.1584, "step": 11586 }, { "epoch": 0.35, "learning_rate": 3.77987528863765e-06, "loss": 1.2812, "step": 11587 }, { "epoch": 0.35, "learning_rate": 3.7796657515219476e-06, "loss": 1.095, "step": 11588 }, { "epoch": 0.35, "learning_rate": 3.779456202224444e-06, "loss": 1.1165, "step": 11589 }, { "epoch": 0.35, "learning_rate": 3.779246640747133e-06, "loss": 1.1254, "step": 11590 }, { "epoch": 0.35, "learning_rate": 3.7790370670920094e-06, "loss": 1.0404, "step": 11591 }, { "epoch": 0.35, "learning_rate": 3.77882748126107e-06, "loss": 1.1212, "step": 11592 }, { "epoch": 0.35, "learning_rate": 3.778617883256309e-06, "loss": 1.2705, "step": 11593 }, { "epoch": 0.35, "learning_rate": 3.7784082730797206e-06, "loss": 0.9623, "step": 11594 }, { "epoch": 0.35, "learning_rate": 3.778198650733302e-06, "loss": 1.0903, "step": 11595 }, { "epoch": 0.35, "learning_rate": 3.777989016219047e-06, "loss": 1.1144, "step": 11596 }, { "epoch": 0.35, "learning_rate": 3.777779369538953e-06, "loss": 1.1439, "step": 11597 }, { "epoch": 0.35, "learning_rate": 3.777569710695014e-06, "loss": 1.066, "step": 11598 }, { "epoch": 0.35, "learning_rate": 3.777360039689227e-06, "loss": 1.1967, "step": 11599 }, { "epoch": 0.35, "learning_rate": 3.7771503565235874e-06, "loss": 1.3215, "step": 11600 }, { "epoch": 0.35, "learning_rate": 3.7769406612000914e-06, "loss": 1.0692, "step": 11601 }, { "epoch": 0.35, "learning_rate": 3.776730953720736e-06, "loss": 1.1158, "step": 11602 }, { "epoch": 0.35, "learning_rate": 3.776521234087516e-06, "loss": 1.1293, "step": 11603 }, { "epoch": 0.35, "learning_rate": 3.7763115023024295e-06, "loss": 1.1824, "step": 11604 }, { "epoch": 0.35, "learning_rate": 3.776101758367472e-06, "loss": 1.027, "step": 11605 }, { "epoch": 0.35, "learning_rate": 3.77589200228464e-06, "loss": 1.1016, "step": 11606 }, { "epoch": 0.35, "learning_rate": 3.7756822340559307e-06, "loss": 1.1327, "step": 11607 }, { "epoch": 0.35, "learning_rate": 3.775472453683341e-06, "loss": 1.1802, "step": 11608 }, { "epoch": 0.35, "learning_rate": 3.7752626611688675e-06, "loss": 1.0864, "step": 11609 }, { "epoch": 0.35, "learning_rate": 3.7750528565145083e-06, "loss": 1.262, "step": 11610 }, { "epoch": 0.35, "learning_rate": 3.7748430397222593e-06, "loss": 1.1107, "step": 11611 }, { "epoch": 0.35, "learning_rate": 3.7746332107941186e-06, "loss": 1.183, "step": 11612 }, { "epoch": 0.35, "learning_rate": 3.7744233697320844e-06, "loss": 1.176, "step": 11613 }, { "epoch": 0.35, "learning_rate": 3.7742135165381528e-06, "loss": 1.1157, "step": 11614 }, { "epoch": 0.35, "learning_rate": 3.7740036512143218e-06, "loss": 1.0992, "step": 11615 }, { "epoch": 0.35, "learning_rate": 3.773793773762591e-06, "loss": 1.1197, "step": 11616 }, { "epoch": 0.35, "learning_rate": 3.7735838841849557e-06, "loss": 1.1236, "step": 11617 }, { "epoch": 0.35, "learning_rate": 3.773373982483416e-06, "loss": 1.0708, "step": 11618 }, { "epoch": 0.35, "learning_rate": 3.773164068659969e-06, "loss": 1.1699, "step": 11619 }, { "epoch": 0.35, "learning_rate": 3.7729541427166128e-06, "loss": 1.0662, "step": 11620 }, { "epoch": 0.35, "learning_rate": 3.772744204655347e-06, "loss": 1.142, "step": 11621 }, { "epoch": 0.35, "learning_rate": 3.7725342544781686e-06, "loss": 1.1577, "step": 11622 }, { "epoch": 0.35, "learning_rate": 3.7723242921870777e-06, "loss": 1.1537, "step": 11623 }, { "epoch": 0.35, "learning_rate": 3.7721143177840717e-06, "loss": 1.1979, "step": 11624 }, { "epoch": 0.35, "learning_rate": 3.7719043312711513e-06, "loss": 1.1144, "step": 11625 }, { "epoch": 0.35, "learning_rate": 3.7716943326503125e-06, "loss": 1.0674, "step": 11626 }, { "epoch": 0.35, "learning_rate": 3.7714843219235564e-06, "loss": 1.0956, "step": 11627 }, { "epoch": 0.35, "learning_rate": 3.7712742990928825e-06, "loss": 1.0945, "step": 11628 }, { "epoch": 0.35, "learning_rate": 3.771064264160289e-06, "loss": 1.129, "step": 11629 }, { "epoch": 0.35, "learning_rate": 3.7708542171277766e-06, "loss": 1.2065, "step": 11630 }, { "epoch": 0.35, "learning_rate": 3.770644157997344e-06, "loss": 1.0896, "step": 11631 }, { "epoch": 0.35, "learning_rate": 3.770434086770991e-06, "loss": 1.0648, "step": 11632 }, { "epoch": 0.35, "learning_rate": 3.770224003450717e-06, "loss": 1.1597, "step": 11633 }, { "epoch": 0.35, "learning_rate": 3.770013908038522e-06, "loss": 1.1068, "step": 11634 }, { "epoch": 0.35, "learning_rate": 3.769803800536407e-06, "loss": 1.1386, "step": 11635 }, { "epoch": 0.35, "learning_rate": 3.769593680946372e-06, "loss": 1.212, "step": 11636 }, { "epoch": 0.35, "learning_rate": 3.769383549270415e-06, "loss": 1.1442, "step": 11637 }, { "epoch": 0.35, "learning_rate": 3.7691734055105388e-06, "loss": 1.0707, "step": 11638 }, { "epoch": 0.35, "learning_rate": 3.768963249668743e-06, "loss": 1.0565, "step": 11639 }, { "epoch": 0.35, "learning_rate": 3.7687530817470273e-06, "loss": 1.0045, "step": 11640 }, { "epoch": 0.35, "learning_rate": 3.768542901747394e-06, "loss": 1.0876, "step": 11641 }, { "epoch": 0.35, "learning_rate": 3.7683327096718436e-06, "loss": 1.0887, "step": 11642 }, { "epoch": 0.35, "learning_rate": 3.7681225055223764e-06, "loss": 1.1109, "step": 11643 }, { "epoch": 0.35, "learning_rate": 3.7679122893009935e-06, "loss": 1.2625, "step": 11644 }, { "epoch": 0.35, "learning_rate": 3.767702061009697e-06, "loss": 1.1012, "step": 11645 }, { "epoch": 0.35, "learning_rate": 3.767491820650486e-06, "loss": 1.1201, "step": 11646 }, { "epoch": 0.35, "learning_rate": 3.767281568225365e-06, "loss": 1.1528, "step": 11647 }, { "epoch": 0.35, "learning_rate": 3.7670713037363326e-06, "loss": 1.1953, "step": 11648 }, { "epoch": 0.35, "learning_rate": 3.7668610271853923e-06, "loss": 1.1407, "step": 11649 }, { "epoch": 0.35, "learning_rate": 3.7666507385745442e-06, "loss": 1.1937, "step": 11650 }, { "epoch": 0.35, "learning_rate": 3.766440437905793e-06, "loss": 1.0328, "step": 11651 }, { "epoch": 0.35, "learning_rate": 3.7662301251811367e-06, "loss": 1.2462, "step": 11652 }, { "epoch": 0.35, "learning_rate": 3.7660198004025806e-06, "loss": 1.033, "step": 11653 }, { "epoch": 0.35, "learning_rate": 3.7658094635721247e-06, "loss": 1.1545, "step": 11654 }, { "epoch": 0.35, "learning_rate": 3.7655991146917735e-06, "loss": 1.064, "step": 11655 }, { "epoch": 0.35, "learning_rate": 3.7653887537635275e-06, "loss": 1.0629, "step": 11656 }, { "epoch": 0.35, "learning_rate": 3.7651783807893906e-06, "loss": 1.1277, "step": 11657 }, { "epoch": 0.35, "learning_rate": 3.7649679957713645e-06, "loss": 1.1581, "step": 11658 }, { "epoch": 0.35, "learning_rate": 3.7647575987114523e-06, "loss": 1.1296, "step": 11659 }, { "epoch": 0.35, "learning_rate": 3.764547189611657e-06, "loss": 1.0889, "step": 11660 }, { "epoch": 0.35, "learning_rate": 3.764336768473982e-06, "loss": 1.1626, "step": 11661 }, { "epoch": 0.35, "learning_rate": 3.7641263353004286e-06, "loss": 1.0992, "step": 11662 }, { "epoch": 0.35, "learning_rate": 3.7639158900930024e-06, "loss": 1.1335, "step": 11663 }, { "epoch": 0.35, "learning_rate": 3.7637054328537053e-06, "loss": 1.2161, "step": 11664 }, { "epoch": 0.35, "learning_rate": 3.763494963584541e-06, "loss": 1.1268, "step": 11665 }, { "epoch": 0.35, "learning_rate": 3.7632844822875138e-06, "loss": 1.1375, "step": 11666 }, { "epoch": 0.35, "learning_rate": 3.7630739889646262e-06, "loss": 1.1046, "step": 11667 }, { "epoch": 0.35, "learning_rate": 3.7628634836178824e-06, "loss": 1.0972, "step": 11668 }, { "epoch": 0.35, "learning_rate": 3.7626529662492863e-06, "loss": 0.9966, "step": 11669 }, { "epoch": 0.35, "learning_rate": 3.762442436860842e-06, "loss": 1.1375, "step": 11670 }, { "epoch": 0.35, "learning_rate": 3.7622318954545547e-06, "loss": 1.2474, "step": 11671 }, { "epoch": 0.35, "learning_rate": 3.7620213420324264e-06, "loss": 1.1378, "step": 11672 }, { "epoch": 0.35, "learning_rate": 3.761810776596464e-06, "loss": 1.1408, "step": 11673 }, { "epoch": 0.35, "learning_rate": 3.7616001991486696e-06, "loss": 1.2484, "step": 11674 }, { "epoch": 0.35, "learning_rate": 3.7613896096910497e-06, "loss": 1.123, "step": 11675 }, { "epoch": 0.35, "learning_rate": 3.761179008225608e-06, "loss": 1.0927, "step": 11676 }, { "epoch": 0.35, "learning_rate": 3.7609683947543497e-06, "loss": 1.1171, "step": 11677 }, { "epoch": 0.35, "learning_rate": 3.760757769279279e-06, "loss": 1.0956, "step": 11678 }, { "epoch": 0.35, "learning_rate": 3.760547131802402e-06, "loss": 0.9976, "step": 11679 }, { "epoch": 0.35, "learning_rate": 3.7603364823257238e-06, "loss": 1.0374, "step": 11680 }, { "epoch": 0.35, "learning_rate": 3.760125820851248e-06, "loss": 1.0484, "step": 11681 }, { "epoch": 0.35, "learning_rate": 3.7599151473809825e-06, "loss": 1.0726, "step": 11682 }, { "epoch": 0.35, "learning_rate": 3.759704461916931e-06, "loss": 1.1344, "step": 11683 }, { "epoch": 0.35, "learning_rate": 3.7594937644610997e-06, "loss": 1.1495, "step": 11684 }, { "epoch": 0.35, "learning_rate": 3.7592830550154946e-06, "loss": 1.1611, "step": 11685 }, { "epoch": 0.35, "learning_rate": 3.7590723335821217e-06, "loss": 1.2042, "step": 11686 }, { "epoch": 0.35, "learning_rate": 3.758861600162986e-06, "loss": 1.1734, "step": 11687 }, { "epoch": 0.35, "learning_rate": 3.7586508547600943e-06, "loss": 1.2637, "step": 11688 }, { "epoch": 0.35, "learning_rate": 3.7584400973754524e-06, "loss": 1.26, "step": 11689 }, { "epoch": 0.35, "learning_rate": 3.7582293280110677e-06, "loss": 1.1481, "step": 11690 }, { "epoch": 0.35, "learning_rate": 3.7580185466689447e-06, "loss": 1.0762, "step": 11691 }, { "epoch": 0.35, "learning_rate": 3.7578077533510917e-06, "loss": 1.2324, "step": 11692 }, { "epoch": 0.35, "learning_rate": 3.7575969480595144e-06, "loss": 1.1107, "step": 11693 }, { "epoch": 0.35, "learning_rate": 3.75738613079622e-06, "loss": 1.2227, "step": 11694 }, { "epoch": 0.35, "learning_rate": 3.757175301563215e-06, "loss": 1.1287, "step": 11695 }, { "epoch": 0.35, "learning_rate": 3.7569644603625064e-06, "loss": 1.0626, "step": 11696 }, { "epoch": 0.35, "learning_rate": 3.756753607196102e-06, "loss": 1.2933, "step": 11697 }, { "epoch": 0.35, "learning_rate": 3.756542742066008e-06, "loss": 1.1819, "step": 11698 }, { "epoch": 0.35, "learning_rate": 3.756331864974233e-06, "loss": 1.1089, "step": 11699 }, { "epoch": 0.35, "learning_rate": 3.7561209759227834e-06, "loss": 1.162, "step": 11700 }, { "epoch": 0.35, "learning_rate": 3.7559100749136667e-06, "loss": 1.1929, "step": 11701 }, { "epoch": 0.35, "learning_rate": 3.7556991619488913e-06, "loss": 1.1325, "step": 11702 }, { "epoch": 0.35, "learning_rate": 3.755488237030465e-06, "loss": 1.0609, "step": 11703 }, { "epoch": 0.35, "learning_rate": 3.7552773001603947e-06, "loss": 1.1233, "step": 11704 }, { "epoch": 0.35, "learning_rate": 3.75506635134069e-06, "loss": 1.1355, "step": 11705 }, { "epoch": 0.35, "learning_rate": 3.754855390573357e-06, "loss": 1.067, "step": 11706 }, { "epoch": 0.35, "learning_rate": 3.7546444178604056e-06, "loss": 1.1366, "step": 11707 }, { "epoch": 0.35, "learning_rate": 3.7544334332038436e-06, "loss": 1.1355, "step": 11708 }, { "epoch": 0.35, "learning_rate": 3.754222436605679e-06, "loss": 1.1851, "step": 11709 }, { "epoch": 0.35, "learning_rate": 3.7540114280679214e-06, "loss": 1.2003, "step": 11710 }, { "epoch": 0.35, "learning_rate": 3.753800407592578e-06, "loss": 1.218, "step": 11711 }, { "epoch": 0.35, "learning_rate": 3.75358937518166e-06, "loss": 1.1575, "step": 11712 }, { "epoch": 0.35, "learning_rate": 3.7533783308371742e-06, "loss": 1.0385, "step": 11713 }, { "epoch": 0.35, "learning_rate": 3.75316727456113e-06, "loss": 1.166, "step": 11714 }, { "epoch": 0.35, "learning_rate": 3.7529562063555375e-06, "loss": 1.1235, "step": 11715 }, { "epoch": 0.35, "learning_rate": 3.7527451262224055e-06, "loss": 1.0765, "step": 11716 }, { "epoch": 0.35, "learning_rate": 3.752534034163743e-06, "loss": 1.1701, "step": 11717 }, { "epoch": 0.35, "learning_rate": 3.7523229301815594e-06, "loss": 1.1407, "step": 11718 }, { "epoch": 0.35, "learning_rate": 3.7521118142778644e-06, "loss": 1.0695, "step": 11719 }, { "epoch": 0.35, "learning_rate": 3.7519006864546693e-06, "loss": 1.2526, "step": 11720 }, { "epoch": 0.35, "learning_rate": 3.7516895467139814e-06, "loss": 0.9993, "step": 11721 }, { "epoch": 0.35, "learning_rate": 3.7514783950578113e-06, "loss": 1.1353, "step": 11722 }, { "epoch": 0.35, "learning_rate": 3.751267231488171e-06, "loss": 1.1438, "step": 11723 }, { "epoch": 0.35, "learning_rate": 3.7510560560070687e-06, "loss": 0.9665, "step": 11724 }, { "epoch": 0.35, "learning_rate": 3.7508448686165153e-06, "loss": 1.1051, "step": 11725 }, { "epoch": 0.35, "learning_rate": 3.750633669318521e-06, "loss": 1.0854, "step": 11726 }, { "epoch": 0.35, "learning_rate": 3.750422458115097e-06, "loss": 1.063, "step": 11727 }, { "epoch": 0.35, "learning_rate": 3.750211235008253e-06, "loss": 1.0837, "step": 11728 }, { "epoch": 0.35, "learning_rate": 3.7500000000000005e-06, "loss": 1.2133, "step": 11729 }, { "epoch": 0.35, "learning_rate": 3.7497887530923493e-06, "loss": 1.1534, "step": 11730 }, { "epoch": 0.35, "learning_rate": 3.749577494287312e-06, "loss": 1.1332, "step": 11731 }, { "epoch": 0.35, "learning_rate": 3.749366223586898e-06, "loss": 1.1259, "step": 11732 }, { "epoch": 0.35, "learning_rate": 3.7491549409931204e-06, "loss": 1.1632, "step": 11733 }, { "epoch": 0.35, "learning_rate": 3.748943646507989e-06, "loss": 1.1445, "step": 11734 }, { "epoch": 0.35, "learning_rate": 3.7487323401335146e-06, "loss": 1.0917, "step": 11735 }, { "epoch": 0.35, "learning_rate": 3.74852102187171e-06, "loss": 1.165, "step": 11736 }, { "epoch": 0.35, "learning_rate": 3.7483096917245866e-06, "loss": 1.1645, "step": 11737 }, { "epoch": 0.35, "learning_rate": 3.748098349694157e-06, "loss": 1.1656, "step": 11738 }, { "epoch": 0.35, "learning_rate": 3.7478869957824315e-06, "loss": 0.9963, "step": 11739 }, { "epoch": 0.35, "learning_rate": 3.747675629991423e-06, "loss": 1.0436, "step": 11740 }, { "epoch": 0.35, "learning_rate": 3.747464252323143e-06, "loss": 1.1984, "step": 11741 }, { "epoch": 0.35, "learning_rate": 3.747252862779605e-06, "loss": 1.1801, "step": 11742 }, { "epoch": 0.35, "learning_rate": 3.7470414613628196e-06, "loss": 1.1226, "step": 11743 }, { "epoch": 0.35, "learning_rate": 3.746830048074801e-06, "loss": 1.1779, "step": 11744 }, { "epoch": 0.35, "learning_rate": 3.74661862291756e-06, "loss": 1.0593, "step": 11745 }, { "epoch": 0.35, "learning_rate": 3.7464071858931106e-06, "loss": 1.1439, "step": 11746 }, { "epoch": 0.35, "learning_rate": 3.746195737003465e-06, "loss": 1.084, "step": 11747 }, { "epoch": 0.35, "learning_rate": 3.745984276250636e-06, "loss": 0.9449, "step": 11748 }, { "epoch": 0.35, "learning_rate": 3.745772803636637e-06, "loss": 1.166, "step": 11749 }, { "epoch": 0.35, "learning_rate": 3.7455613191634805e-06, "loss": 1.0461, "step": 11750 }, { "epoch": 0.35, "learning_rate": 3.7453498228331798e-06, "loss": 1.063, "step": 11751 }, { "epoch": 0.35, "learning_rate": 3.745138314647749e-06, "loss": 1.075, "step": 11752 }, { "epoch": 0.35, "learning_rate": 3.7449267946092017e-06, "loss": 1.1021, "step": 11753 }, { "epoch": 0.35, "learning_rate": 3.74471526271955e-06, "loss": 1.1351, "step": 11754 }, { "epoch": 0.35, "learning_rate": 3.744503718980809e-06, "loss": 1.3168, "step": 11755 }, { "epoch": 0.35, "learning_rate": 3.7442921633949917e-06, "loss": 1.091, "step": 11756 }, { "epoch": 0.35, "learning_rate": 3.744080595964113e-06, "loss": 1.1584, "step": 11757 }, { "epoch": 0.35, "learning_rate": 3.7438690166901854e-06, "loss": 1.1551, "step": 11758 }, { "epoch": 0.35, "learning_rate": 3.7436574255752246e-06, "loss": 1.157, "step": 11759 }, { "epoch": 0.35, "learning_rate": 3.743445822621243e-06, "loss": 1.2008, "step": 11760 }, { "epoch": 0.35, "learning_rate": 3.7432342078302563e-06, "loss": 1.1216, "step": 11761 }, { "epoch": 0.35, "learning_rate": 3.743022581204279e-06, "loss": 1.1517, "step": 11762 }, { "epoch": 0.35, "learning_rate": 3.742810942745325e-06, "loss": 1.1605, "step": 11763 }, { "epoch": 0.35, "learning_rate": 3.74259929245541e-06, "loss": 1.1515, "step": 11764 }, { "epoch": 0.35, "learning_rate": 3.742387630336548e-06, "loss": 1.2144, "step": 11765 }, { "epoch": 0.35, "learning_rate": 3.742175956390754e-06, "loss": 1.0444, "step": 11766 }, { "epoch": 0.35, "learning_rate": 3.741964270620043e-06, "loss": 1.1575, "step": 11767 }, { "epoch": 0.35, "learning_rate": 3.741752573026431e-06, "loss": 1.1555, "step": 11768 }, { "epoch": 0.35, "learning_rate": 3.7415408636119315e-06, "loss": 1.1666, "step": 11769 }, { "epoch": 0.35, "learning_rate": 3.741329142378562e-06, "loss": 1.2279, "step": 11770 }, { "epoch": 0.35, "learning_rate": 3.7411174093283367e-06, "loss": 1.2053, "step": 11771 }, { "epoch": 0.35, "learning_rate": 3.740905664463271e-06, "loss": 1.0906, "step": 11772 }, { "epoch": 0.35, "learning_rate": 3.740693907785381e-06, "loss": 1.0375, "step": 11773 }, { "epoch": 0.35, "learning_rate": 3.7404821392966823e-06, "loss": 1.17, "step": 11774 }, { "epoch": 0.35, "learning_rate": 3.7402703589991917e-06, "loss": 1.2852, "step": 11775 }, { "epoch": 0.35, "learning_rate": 3.740058566894924e-06, "loss": 1.0644, "step": 11776 }, { "epoch": 0.35, "learning_rate": 3.7398467629858957e-06, "loss": 1.183, "step": 11777 }, { "epoch": 0.35, "learning_rate": 3.739634947274124e-06, "loss": 1.0477, "step": 11778 }, { "epoch": 0.35, "learning_rate": 3.7394231197616248e-06, "loss": 1.1368, "step": 11779 }, { "epoch": 0.35, "learning_rate": 3.7392112804504144e-06, "loss": 1.2888, "step": 11780 }, { "epoch": 0.35, "learning_rate": 3.7389994293425093e-06, "loss": 1.1457, "step": 11781 }, { "epoch": 0.35, "learning_rate": 3.7387875664399257e-06, "loss": 1.101, "step": 11782 }, { "epoch": 0.35, "learning_rate": 3.7385756917446827e-06, "loss": 1.0768, "step": 11783 }, { "epoch": 0.35, "learning_rate": 3.738363805258794e-06, "loss": 1.1381, "step": 11784 }, { "epoch": 0.36, "learning_rate": 3.7381519069842793e-06, "loss": 1.1242, "step": 11785 }, { "epoch": 0.36, "learning_rate": 3.7379399969231537e-06, "loss": 1.1853, "step": 11786 }, { "epoch": 0.36, "learning_rate": 3.7377280750774363e-06, "loss": 1.2363, "step": 11787 }, { "epoch": 0.36, "learning_rate": 3.737516141449144e-06, "loss": 1.107, "step": 11788 }, { "epoch": 0.36, "learning_rate": 3.7373041960402935e-06, "loss": 1.1376, "step": 11789 }, { "epoch": 0.36, "learning_rate": 3.7370922388529035e-06, "loss": 1.0613, "step": 11790 }, { "epoch": 0.36, "learning_rate": 3.7368802698889904e-06, "loss": 1.1469, "step": 11791 }, { "epoch": 0.36, "learning_rate": 3.7366682891505734e-06, "loss": 1.1947, "step": 11792 }, { "epoch": 0.36, "learning_rate": 3.7364562966396695e-06, "loss": 1.2004, "step": 11793 }, { "epoch": 0.36, "learning_rate": 3.7362442923582975e-06, "loss": 1.2073, "step": 11794 }, { "epoch": 0.36, "learning_rate": 3.736032276308475e-06, "loss": 1.1133, "step": 11795 }, { "epoch": 0.36, "learning_rate": 3.735820248492221e-06, "loss": 1.0814, "step": 11796 }, { "epoch": 0.36, "learning_rate": 3.735608208911553e-06, "loss": 1.1755, "step": 11797 }, { "epoch": 0.36, "learning_rate": 3.7353961575684897e-06, "loss": 1.1383, "step": 11798 }, { "epoch": 0.36, "learning_rate": 3.7351840944650507e-06, "loss": 1.1097, "step": 11799 }, { "epoch": 0.36, "learning_rate": 3.7349720196032535e-06, "loss": 1.1594, "step": 11800 }, { "epoch": 0.36, "learning_rate": 3.7347599329851177e-06, "loss": 1.2192, "step": 11801 }, { "epoch": 0.36, "learning_rate": 3.734547834612662e-06, "loss": 1.1062, "step": 11802 }, { "epoch": 0.36, "learning_rate": 3.7343357244879053e-06, "loss": 1.0569, "step": 11803 }, { "epoch": 0.36, "learning_rate": 3.7341236026128667e-06, "loss": 1.1141, "step": 11804 }, { "epoch": 0.36, "learning_rate": 3.733911468989566e-06, "loss": 1.1483, "step": 11805 }, { "epoch": 0.36, "learning_rate": 3.7336993236200223e-06, "loss": 1.1891, "step": 11806 }, { "epoch": 0.36, "learning_rate": 3.7334871665062557e-06, "loss": 1.1553, "step": 11807 }, { "epoch": 0.36, "learning_rate": 3.7332749976502847e-06, "loss": 1.0936, "step": 11808 }, { "epoch": 0.36, "learning_rate": 3.7330628170541305e-06, "loss": 1.1539, "step": 11809 }, { "epoch": 0.36, "learning_rate": 3.7328506247198115e-06, "loss": 1.1149, "step": 11810 }, { "epoch": 0.36, "learning_rate": 3.7326384206493487e-06, "loss": 1.1707, "step": 11811 }, { "epoch": 0.36, "learning_rate": 3.7324262048447614e-06, "loss": 1.1327, "step": 11812 }, { "epoch": 0.36, "learning_rate": 3.7322139773080708e-06, "loss": 1.0891, "step": 11813 }, { "epoch": 0.36, "learning_rate": 3.732001738041296e-06, "loss": 1.1768, "step": 11814 }, { "epoch": 0.36, "learning_rate": 3.7317894870464577e-06, "loss": 1.098, "step": 11815 }, { "epoch": 0.36, "learning_rate": 3.731577224325578e-06, "loss": 1.1487, "step": 11816 }, { "epoch": 0.36, "learning_rate": 3.7313649498806747e-06, "loss": 1.1139, "step": 11817 }, { "epoch": 0.36, "learning_rate": 3.731152663713771e-06, "loss": 1.2698, "step": 11818 }, { "epoch": 0.36, "learning_rate": 3.7309403658268866e-06, "loss": 1.1643, "step": 11819 }, { "epoch": 0.36, "learning_rate": 3.730728056222043e-06, "loss": 1.0996, "step": 11820 }, { "epoch": 0.36, "learning_rate": 3.730515734901261e-06, "loss": 1.1241, "step": 11821 }, { "epoch": 0.36, "learning_rate": 3.730303401866562e-06, "loss": 1.008, "step": 11822 }, { "epoch": 0.36, "learning_rate": 3.7300910571199667e-06, "loss": 1.1548, "step": 11823 }, { "epoch": 0.36, "learning_rate": 3.7298787006634977e-06, "loss": 1.1334, "step": 11824 }, { "epoch": 0.36, "learning_rate": 3.7296663324991755e-06, "loss": 1.3195, "step": 11825 }, { "epoch": 0.36, "learning_rate": 3.7294539526290218e-06, "loss": 1.1526, "step": 11826 }, { "epoch": 0.36, "learning_rate": 3.7292415610550585e-06, "loss": 1.1743, "step": 11827 }, { "epoch": 0.36, "learning_rate": 3.729029157779308e-06, "loss": 1.0452, "step": 11828 }, { "epoch": 0.36, "learning_rate": 3.7288167428037912e-06, "loss": 1.1989, "step": 11829 }, { "epoch": 0.36, "learning_rate": 3.7286043161305313e-06, "loss": 1.1887, "step": 11830 }, { "epoch": 0.36, "learning_rate": 3.72839187776155e-06, "loss": 1.188, "step": 11831 }, { "epoch": 0.36, "learning_rate": 3.7281794276988697e-06, "loss": 1.1467, "step": 11832 }, { "epoch": 0.36, "learning_rate": 3.727966965944513e-06, "loss": 1.1127, "step": 11833 }, { "epoch": 0.36, "learning_rate": 3.727754492500501e-06, "loss": 1.1484, "step": 11834 }, { "epoch": 0.36, "learning_rate": 3.727542007368859e-06, "loss": 1.053, "step": 11835 }, { "epoch": 0.36, "learning_rate": 3.7273295105516073e-06, "loss": 1.1124, "step": 11836 }, { "epoch": 0.36, "learning_rate": 3.7271170020507706e-06, "loss": 1.2007, "step": 11837 }, { "epoch": 0.36, "learning_rate": 3.7269044818683705e-06, "loss": 1.2303, "step": 11838 }, { "epoch": 0.36, "learning_rate": 3.7266919500064307e-06, "loss": 1.0272, "step": 11839 }, { "epoch": 0.36, "learning_rate": 3.726479406466974e-06, "loss": 1.1082, "step": 11840 }, { "epoch": 0.36, "learning_rate": 3.7262668512520244e-06, "loss": 1.0955, "step": 11841 }, { "epoch": 0.36, "learning_rate": 3.726054284363605e-06, "loss": 1.1929, "step": 11842 }, { "epoch": 0.36, "learning_rate": 3.7258417058037394e-06, "loss": 1.1628, "step": 11843 }, { "epoch": 0.36, "learning_rate": 3.725629115574451e-06, "loss": 1.2778, "step": 11844 }, { "epoch": 0.36, "learning_rate": 3.7254165136777636e-06, "loss": 1.1714, "step": 11845 }, { "epoch": 0.36, "learning_rate": 3.725203900115701e-06, "loss": 1.0185, "step": 11846 }, { "epoch": 0.36, "learning_rate": 3.7249912748902873e-06, "loss": 1.1248, "step": 11847 }, { "epoch": 0.36, "learning_rate": 3.724778638003548e-06, "loss": 1.2518, "step": 11848 }, { "epoch": 0.36, "learning_rate": 3.724565989457504e-06, "loss": 1.1107, "step": 11849 }, { "epoch": 0.36, "learning_rate": 3.7243533292541826e-06, "loss": 1.229, "step": 11850 }, { "epoch": 0.36, "learning_rate": 3.724140657395607e-06, "loss": 1.1642, "step": 11851 }, { "epoch": 0.36, "learning_rate": 3.7239279738838024e-06, "loss": 1.0197, "step": 11852 }, { "epoch": 0.36, "learning_rate": 3.723715278720792e-06, "loss": 1.0107, "step": 11853 }, { "epoch": 0.36, "learning_rate": 3.723502571908602e-06, "loss": 1.1661, "step": 11854 }, { "epoch": 0.36, "learning_rate": 3.723289853449257e-06, "loss": 1.174, "step": 11855 }, { "epoch": 0.36, "learning_rate": 3.7230771233447815e-06, "loss": 1.0371, "step": 11856 }, { "epoch": 0.36, "learning_rate": 3.722864381597201e-06, "loss": 1.0942, "step": 11857 }, { "epoch": 0.36, "learning_rate": 3.72265162820854e-06, "loss": 1.0543, "step": 11858 }, { "epoch": 0.36, "learning_rate": 3.722438863180825e-06, "loss": 1.1884, "step": 11859 }, { "epoch": 0.36, "learning_rate": 3.72222608651608e-06, "loss": 1.1366, "step": 11860 }, { "epoch": 0.36, "learning_rate": 3.722013298216332e-06, "loss": 1.1669, "step": 11861 }, { "epoch": 0.36, "learning_rate": 3.721800498283606e-06, "loss": 1.2166, "step": 11862 }, { "epoch": 0.36, "learning_rate": 3.7215876867199273e-06, "loss": 1.1056, "step": 11863 }, { "epoch": 0.36, "learning_rate": 3.721374863527322e-06, "loss": 1.0165, "step": 11864 }, { "epoch": 0.36, "learning_rate": 3.721162028707817e-06, "loss": 1.0969, "step": 11865 }, { "epoch": 0.36, "learning_rate": 3.720949182263437e-06, "loss": 1.1469, "step": 11866 }, { "epoch": 0.36, "learning_rate": 3.720736324196209e-06, "loss": 1.1122, "step": 11867 }, { "epoch": 0.36, "learning_rate": 3.720523454508159e-06, "loss": 1.3024, "step": 11868 }, { "epoch": 0.36, "learning_rate": 3.7203105732013134e-06, "loss": 1.2075, "step": 11869 }, { "epoch": 0.36, "learning_rate": 3.7200976802777e-06, "loss": 1.1151, "step": 11870 }, { "epoch": 0.36, "learning_rate": 3.719884775739343e-06, "loss": 1.0901, "step": 11871 }, { "epoch": 0.36, "learning_rate": 3.719671859588271e-06, "loss": 1.1489, "step": 11872 }, { "epoch": 0.36, "learning_rate": 3.71945893182651e-06, "loss": 1.1511, "step": 11873 }, { "epoch": 0.36, "learning_rate": 3.7192459924560877e-06, "loss": 1.2379, "step": 11874 }, { "epoch": 0.36, "learning_rate": 3.71903304147903e-06, "loss": 1.2065, "step": 11875 }, { "epoch": 0.36, "learning_rate": 3.7188200788973654e-06, "loss": 1.0596, "step": 11876 }, { "epoch": 0.36, "learning_rate": 3.7186071047131206e-06, "loss": 1.1007, "step": 11877 }, { "epoch": 0.36, "learning_rate": 3.7183941189283234e-06, "loss": 1.1036, "step": 11878 }, { "epoch": 0.36, "learning_rate": 3.7181811215450003e-06, "loss": 1.1581, "step": 11879 }, { "epoch": 0.36, "learning_rate": 3.71796811256518e-06, "loss": 1.1671, "step": 11880 }, { "epoch": 0.36, "learning_rate": 3.71775509199089e-06, "loss": 1.1053, "step": 11881 }, { "epoch": 0.36, "learning_rate": 3.7175420598241573e-06, "loss": 1.0908, "step": 11882 }, { "epoch": 0.36, "learning_rate": 3.7173290160670115e-06, "loss": 1.1208, "step": 11883 }, { "epoch": 0.36, "learning_rate": 3.7171159607214796e-06, "loss": 1.0919, "step": 11884 }, { "epoch": 0.36, "learning_rate": 3.7169028937895903e-06, "loss": 1.0853, "step": 11885 }, { "epoch": 0.36, "learning_rate": 3.7166898152733705e-06, "loss": 1.2646, "step": 11886 }, { "epoch": 0.36, "learning_rate": 3.7164767251748497e-06, "loss": 1.0585, "step": 11887 }, { "epoch": 0.36, "learning_rate": 3.7162636234960566e-06, "loss": 1.1478, "step": 11888 }, { "epoch": 0.36, "learning_rate": 3.7160505102390197e-06, "loss": 1.2374, "step": 11889 }, { "epoch": 0.36, "learning_rate": 3.715837385405768e-06, "loss": 1.1207, "step": 11890 }, { "epoch": 0.36, "learning_rate": 3.7156242489983295e-06, "loss": 1.0692, "step": 11891 }, { "epoch": 0.36, "learning_rate": 3.715411101018734e-06, "loss": 1.1829, "step": 11892 }, { "epoch": 0.36, "learning_rate": 3.7151979414690094e-06, "loss": 1.2192, "step": 11893 }, { "epoch": 0.36, "learning_rate": 3.7149847703511867e-06, "loss": 1.1317, "step": 11894 }, { "epoch": 0.36, "learning_rate": 3.714771587667293e-06, "loss": 1.1854, "step": 11895 }, { "epoch": 0.36, "learning_rate": 3.71455839341936e-06, "loss": 1.0573, "step": 11896 }, { "epoch": 0.36, "learning_rate": 3.714345187609415e-06, "loss": 1.0896, "step": 11897 }, { "epoch": 0.36, "learning_rate": 3.7141319702394895e-06, "loss": 1.121, "step": 11898 }, { "epoch": 0.36, "learning_rate": 3.713918741311612e-06, "loss": 1.2087, "step": 11899 }, { "epoch": 0.36, "learning_rate": 3.7137055008278122e-06, "loss": 1.1501, "step": 11900 }, { "epoch": 0.36, "learning_rate": 3.7134922487901207e-06, "loss": 1.1335, "step": 11901 }, { "epoch": 0.36, "learning_rate": 3.7132789852005685e-06, "loss": 1.161, "step": 11902 }, { "epoch": 0.36, "learning_rate": 3.7130657100611837e-06, "loss": 1.071, "step": 11903 }, { "epoch": 0.36, "learning_rate": 3.712852423373998e-06, "loss": 1.2232, "step": 11904 }, { "epoch": 0.36, "learning_rate": 3.7126391251410413e-06, "loss": 1.1774, "step": 11905 }, { "epoch": 0.36, "learning_rate": 3.7124258153643444e-06, "loss": 1.2057, "step": 11906 }, { "epoch": 0.36, "learning_rate": 3.7122124940459376e-06, "loss": 1.1401, "step": 11907 }, { "epoch": 0.36, "learning_rate": 3.7119991611878516e-06, "loss": 1.1312, "step": 11908 }, { "epoch": 0.36, "learning_rate": 3.7117858167921172e-06, "loss": 1.0419, "step": 11909 }, { "epoch": 0.36, "learning_rate": 3.7115724608607653e-06, "loss": 1.1383, "step": 11910 }, { "epoch": 0.36, "learning_rate": 3.7113590933958273e-06, "loss": 1.1129, "step": 11911 }, { "epoch": 0.36, "learning_rate": 3.7111457143993336e-06, "loss": 1.2255, "step": 11912 }, { "epoch": 0.36, "learning_rate": 3.7109323238733168e-06, "loss": 1.2382, "step": 11913 }, { "epoch": 0.36, "learning_rate": 3.710718921819807e-06, "loss": 1.1889, "step": 11914 }, { "epoch": 0.36, "learning_rate": 3.710505508240836e-06, "loss": 1.2347, "step": 11915 }, { "epoch": 0.36, "learning_rate": 3.7102920831384357e-06, "loss": 1.1216, "step": 11916 }, { "epoch": 0.36, "learning_rate": 3.7100786465146383e-06, "loss": 1.1727, "step": 11917 }, { "epoch": 0.36, "learning_rate": 3.709865198371474e-06, "loss": 1.1201, "step": 11918 }, { "epoch": 0.36, "learning_rate": 3.7096517387109765e-06, "loss": 1.1491, "step": 11919 }, { "epoch": 0.36, "learning_rate": 3.709438267535177e-06, "loss": 1.1499, "step": 11920 }, { "epoch": 0.36, "learning_rate": 3.7092247848461073e-06, "loss": 1.1588, "step": 11921 }, { "epoch": 0.36, "learning_rate": 3.7090112906458004e-06, "loss": 1.1657, "step": 11922 }, { "epoch": 0.36, "learning_rate": 3.7087977849362877e-06, "loss": 1.0206, "step": 11923 }, { "epoch": 0.36, "learning_rate": 3.7085842677196025e-06, "loss": 1.2214, "step": 11924 }, { "epoch": 0.36, "learning_rate": 3.7083707389977776e-06, "loss": 1.1285, "step": 11925 }, { "epoch": 0.36, "learning_rate": 3.708157198772845e-06, "loss": 1.126, "step": 11926 }, { "epoch": 0.36, "learning_rate": 3.7079436470468377e-06, "loss": 1.0719, "step": 11927 }, { "epoch": 0.36, "learning_rate": 3.7077300838217876e-06, "loss": 1.1903, "step": 11928 }, { "epoch": 0.36, "learning_rate": 3.7075165090997302e-06, "loss": 1.1042, "step": 11929 }, { "epoch": 0.36, "learning_rate": 3.7073029228826967e-06, "loss": 1.0676, "step": 11930 }, { "epoch": 0.36, "learning_rate": 3.707089325172721e-06, "loss": 1.039, "step": 11931 }, { "epoch": 0.36, "learning_rate": 3.706875715971836e-06, "loss": 1.1235, "step": 11932 }, { "epoch": 0.36, "learning_rate": 3.7066620952820754e-06, "loss": 1.1314, "step": 11933 }, { "epoch": 0.36, "learning_rate": 3.7064484631054733e-06, "loss": 1.045, "step": 11934 }, { "epoch": 0.36, "learning_rate": 3.706234819444062e-06, "loss": 1.134, "step": 11935 }, { "epoch": 0.36, "learning_rate": 3.706021164299877e-06, "loss": 1.1348, "step": 11936 }, { "epoch": 0.36, "learning_rate": 3.7058074976749516e-06, "loss": 1.2366, "step": 11937 }, { "epoch": 0.36, "learning_rate": 3.7055938195713185e-06, "loss": 1.21, "step": 11938 }, { "epoch": 0.36, "learning_rate": 3.705380129991014e-06, "loss": 1.2109, "step": 11939 }, { "epoch": 0.36, "learning_rate": 3.70516642893607e-06, "loss": 1.1665, "step": 11940 }, { "epoch": 0.36, "learning_rate": 3.7049527164085232e-06, "loss": 1.1675, "step": 11941 }, { "epoch": 0.36, "learning_rate": 3.7047389924104055e-06, "loss": 1.229, "step": 11942 }, { "epoch": 0.36, "learning_rate": 3.704525256943754e-06, "loss": 1.1129, "step": 11943 }, { "epoch": 0.36, "learning_rate": 3.7043115100106018e-06, "loss": 1.1077, "step": 11944 }, { "epoch": 0.36, "learning_rate": 3.704097751612984e-06, "loss": 1.1953, "step": 11945 }, { "epoch": 0.36, "learning_rate": 3.7038839817529352e-06, "loss": 1.0797, "step": 11946 }, { "epoch": 0.36, "learning_rate": 3.703670200432491e-06, "loss": 1.1749, "step": 11947 }, { "epoch": 0.36, "learning_rate": 3.703456407653687e-06, "loss": 1.2271, "step": 11948 }, { "epoch": 0.36, "learning_rate": 3.7032426034185563e-06, "loss": 1.0971, "step": 11949 }, { "epoch": 0.36, "learning_rate": 3.7030287877291364e-06, "loss": 1.2394, "step": 11950 }, { "epoch": 0.36, "learning_rate": 3.7028149605874614e-06, "loss": 1.0966, "step": 11951 }, { "epoch": 0.36, "learning_rate": 3.7026011219955674e-06, "loss": 1.1478, "step": 11952 }, { "epoch": 0.36, "learning_rate": 3.70238727195549e-06, "loss": 1.1492, "step": 11953 }, { "epoch": 0.36, "learning_rate": 3.7021734104692645e-06, "loss": 1.1104, "step": 11954 }, { "epoch": 0.36, "learning_rate": 3.701959537538927e-06, "loss": 1.2002, "step": 11955 }, { "epoch": 0.36, "learning_rate": 3.701745653166514e-06, "loss": 1.2416, "step": 11956 }, { "epoch": 0.36, "learning_rate": 3.701531757354061e-06, "loss": 1.262, "step": 11957 }, { "epoch": 0.36, "learning_rate": 3.701317850103605e-06, "loss": 1.166, "step": 11958 }, { "epoch": 0.36, "learning_rate": 3.701103931417181e-06, "loss": 1.0295, "step": 11959 }, { "epoch": 0.36, "learning_rate": 3.700890001296826e-06, "loss": 1.1083, "step": 11960 }, { "epoch": 0.36, "learning_rate": 3.7006760597445768e-06, "loss": 1.2328, "step": 11961 }, { "epoch": 0.36, "learning_rate": 3.7004621067624698e-06, "loss": 1.2324, "step": 11962 }, { "epoch": 0.36, "learning_rate": 3.7002481423525416e-06, "loss": 1.0969, "step": 11963 }, { "epoch": 0.36, "learning_rate": 3.700034166516829e-06, "loss": 1.1952, "step": 11964 }, { "epoch": 0.36, "learning_rate": 3.6998201792573694e-06, "loss": 1.122, "step": 11965 }, { "epoch": 0.36, "learning_rate": 3.699606180576199e-06, "loss": 1.1899, "step": 11966 }, { "epoch": 0.36, "learning_rate": 3.6993921704753564e-06, "loss": 1.1599, "step": 11967 }, { "epoch": 0.36, "learning_rate": 3.6991781489568775e-06, "loss": 1.1671, "step": 11968 }, { "epoch": 0.36, "learning_rate": 3.6989641160227995e-06, "loss": 1.0763, "step": 11969 }, { "epoch": 0.36, "learning_rate": 3.6987500716751614e-06, "loss": 1.1642, "step": 11970 }, { "epoch": 0.36, "learning_rate": 3.6985360159159998e-06, "loss": 1.1624, "step": 11971 }, { "epoch": 0.36, "learning_rate": 3.6983219487473522e-06, "loss": 1.106, "step": 11972 }, { "epoch": 0.36, "learning_rate": 3.698107870171257e-06, "loss": 1.1735, "step": 11973 }, { "epoch": 0.36, "learning_rate": 3.697893780189752e-06, "loss": 1.1478, "step": 11974 }, { "epoch": 0.36, "learning_rate": 3.6976796788048752e-06, "loss": 1.1863, "step": 11975 }, { "epoch": 0.36, "learning_rate": 3.6974655660186648e-06, "loss": 1.1024, "step": 11976 }, { "epoch": 0.36, "learning_rate": 3.6972514418331586e-06, "loss": 1.1299, "step": 11977 }, { "epoch": 0.36, "learning_rate": 3.6970373062503956e-06, "loss": 1.0894, "step": 11978 }, { "epoch": 0.36, "learning_rate": 3.6968231592724136e-06, "loss": 1.1033, "step": 11979 }, { "epoch": 0.36, "learning_rate": 3.6966090009012523e-06, "loss": 1.0971, "step": 11980 }, { "epoch": 0.36, "learning_rate": 3.6963948311389484e-06, "loss": 1.2021, "step": 11981 }, { "epoch": 0.36, "learning_rate": 3.6961806499875425e-06, "loss": 1.1185, "step": 11982 }, { "epoch": 0.36, "learning_rate": 3.6959664574490728e-06, "loss": 1.0904, "step": 11983 }, { "epoch": 0.36, "learning_rate": 3.6957522535255786e-06, "loss": 1.095, "step": 11984 }, { "epoch": 0.36, "learning_rate": 3.6955380382190988e-06, "loss": 1.1878, "step": 11985 }, { "epoch": 0.36, "learning_rate": 3.6953238115316725e-06, "loss": 1.3005, "step": 11986 }, { "epoch": 0.36, "learning_rate": 3.69510957346534e-06, "loss": 1.1558, "step": 11987 }, { "epoch": 0.36, "learning_rate": 3.6948953240221384e-06, "loss": 1.0933, "step": 11988 }, { "epoch": 0.36, "learning_rate": 3.6946810632041108e-06, "loss": 1.1364, "step": 11989 }, { "epoch": 0.36, "learning_rate": 3.694466791013293e-06, "loss": 1.1009, "step": 11990 }, { "epoch": 0.36, "learning_rate": 3.694252507451728e-06, "loss": 1.1923, "step": 11991 }, { "epoch": 0.36, "learning_rate": 3.6940382125214536e-06, "loss": 1.0959, "step": 11992 }, { "epoch": 0.36, "learning_rate": 3.6938239062245105e-06, "loss": 1.2197, "step": 11993 }, { "epoch": 0.36, "learning_rate": 3.6936095885629387e-06, "loss": 1.0339, "step": 11994 }, { "epoch": 0.36, "learning_rate": 3.693395259538779e-06, "loss": 1.1312, "step": 11995 }, { "epoch": 0.36, "learning_rate": 3.6931809191540706e-06, "loss": 1.0832, "step": 11996 }, { "epoch": 0.36, "learning_rate": 3.692966567410855e-06, "loss": 1.1598, "step": 11997 }, { "epoch": 0.36, "learning_rate": 3.692752204311172e-06, "loss": 1.0975, "step": 11998 }, { "epoch": 0.36, "learning_rate": 3.6925378298570624e-06, "loss": 1.116, "step": 11999 }, { "epoch": 0.36, "learning_rate": 3.6923234440505667e-06, "loss": 1.2745, "step": 12000 }, { "epoch": 0.36, "learning_rate": 3.692109046893726e-06, "loss": 1.1385, "step": 12001 }, { "epoch": 0.36, "learning_rate": 3.6918946383885823e-06, "loss": 1.1006, "step": 12002 }, { "epoch": 0.36, "learning_rate": 3.691680218537175e-06, "loss": 1.0156, "step": 12003 }, { "epoch": 0.36, "learning_rate": 3.691465787341546e-06, "loss": 1.0594, "step": 12004 }, { "epoch": 0.36, "learning_rate": 3.6912513448037367e-06, "loss": 1.2352, "step": 12005 }, { "epoch": 0.36, "learning_rate": 3.691036890925788e-06, "loss": 1.1906, "step": 12006 }, { "epoch": 0.36, "learning_rate": 3.690822425709742e-06, "loss": 1.1141, "step": 12007 }, { "epoch": 0.36, "learning_rate": 3.6906079491576403e-06, "loss": 1.2064, "step": 12008 }, { "epoch": 0.36, "learning_rate": 3.6903934612715238e-06, "loss": 1.0897, "step": 12009 }, { "epoch": 0.36, "learning_rate": 3.690178962053435e-06, "loss": 1.1018, "step": 12010 }, { "epoch": 0.36, "learning_rate": 3.689964451505416e-06, "loss": 1.0655, "step": 12011 }, { "epoch": 0.36, "learning_rate": 3.689749929629508e-06, "loss": 1.0637, "step": 12012 }, { "epoch": 0.36, "learning_rate": 3.6895353964277534e-06, "loss": 1.2949, "step": 12013 }, { "epoch": 0.36, "learning_rate": 3.6893208519021955e-06, "loss": 1.1025, "step": 12014 }, { "epoch": 0.36, "learning_rate": 3.689106296054876e-06, "loss": 1.1224, "step": 12015 }, { "epoch": 0.36, "learning_rate": 3.6888917288878367e-06, "loss": 1.1705, "step": 12016 }, { "epoch": 0.36, "learning_rate": 3.688677150403121e-06, "loss": 1.1038, "step": 12017 }, { "epoch": 0.36, "learning_rate": 3.688462560602771e-06, "loss": 1.1754, "step": 12018 }, { "epoch": 0.36, "learning_rate": 3.6882479594888305e-06, "loss": 1.0867, "step": 12019 }, { "epoch": 0.36, "learning_rate": 3.688033347063341e-06, "loss": 1.1866, "step": 12020 }, { "epoch": 0.36, "learning_rate": 3.6878187233283467e-06, "loss": 1.1064, "step": 12021 }, { "epoch": 0.36, "learning_rate": 3.6876040882858898e-06, "loss": 1.0948, "step": 12022 }, { "epoch": 0.36, "learning_rate": 3.687389441938014e-06, "loss": 1.2351, "step": 12023 }, { "epoch": 0.36, "learning_rate": 3.6871747842867626e-06, "loss": 1.1506, "step": 12024 }, { "epoch": 0.36, "learning_rate": 3.6869601153341793e-06, "loss": 1.082, "step": 12025 }, { "epoch": 0.36, "learning_rate": 3.6867454350823074e-06, "loss": 1.2003, "step": 12026 }, { "epoch": 0.36, "learning_rate": 3.68653074353319e-06, "loss": 1.0965, "step": 12027 }, { "epoch": 0.36, "learning_rate": 3.686316040688872e-06, "loss": 1.0956, "step": 12028 }, { "epoch": 0.36, "learning_rate": 3.686101326551396e-06, "loss": 1.2292, "step": 12029 }, { "epoch": 0.36, "learning_rate": 3.6858866011228072e-06, "loss": 1.2584, "step": 12030 }, { "epoch": 0.36, "learning_rate": 3.685671864405149e-06, "loss": 1.1887, "step": 12031 }, { "epoch": 0.36, "learning_rate": 3.685457116400466e-06, "loss": 1.1329, "step": 12032 }, { "epoch": 0.36, "learning_rate": 3.6852423571108013e-06, "loss": 1.1346, "step": 12033 }, { "epoch": 0.36, "learning_rate": 3.685027586538201e-06, "loss": 1.0687, "step": 12034 }, { "epoch": 0.36, "learning_rate": 3.684812804684708e-06, "loss": 1.0399, "step": 12035 }, { "epoch": 0.36, "learning_rate": 3.6845980115523683e-06, "loss": 1.1442, "step": 12036 }, { "epoch": 0.36, "learning_rate": 3.684383207143226e-06, "loss": 1.1736, "step": 12037 }, { "epoch": 0.36, "learning_rate": 3.6841683914593257e-06, "loss": 1.095, "step": 12038 }, { "epoch": 0.36, "learning_rate": 3.6839535645027123e-06, "loss": 1.1595, "step": 12039 }, { "epoch": 0.36, "learning_rate": 3.683738726275432e-06, "loss": 1.0016, "step": 12040 }, { "epoch": 0.36, "learning_rate": 3.683523876779529e-06, "loss": 1.1589, "step": 12041 }, { "epoch": 0.36, "learning_rate": 3.6833090160170483e-06, "loss": 1.1899, "step": 12042 }, { "epoch": 0.36, "learning_rate": 3.6830941439900362e-06, "loss": 1.2412, "step": 12043 }, { "epoch": 0.36, "learning_rate": 3.682879260700537e-06, "loss": 1.135, "step": 12044 }, { "epoch": 0.36, "learning_rate": 3.682664366150598e-06, "loss": 1.0591, "step": 12045 }, { "epoch": 0.36, "learning_rate": 3.6824494603422627e-06, "loss": 1.1678, "step": 12046 }, { "epoch": 0.36, "learning_rate": 3.6822345432775788e-06, "loss": 1.0627, "step": 12047 }, { "epoch": 0.36, "learning_rate": 3.682019614958591e-06, "loss": 1.2941, "step": 12048 }, { "epoch": 0.36, "learning_rate": 3.681804675387346e-06, "loss": 1.1984, "step": 12049 }, { "epoch": 0.36, "learning_rate": 3.681589724565889e-06, "loss": 1.0892, "step": 12050 }, { "epoch": 0.36, "learning_rate": 3.6813747624962675e-06, "loss": 1.0847, "step": 12051 }, { "epoch": 0.36, "learning_rate": 3.6811597891805266e-06, "loss": 1.0993, "step": 12052 }, { "epoch": 0.36, "learning_rate": 3.6809448046207143e-06, "loss": 1.1091, "step": 12053 }, { "epoch": 0.36, "learning_rate": 3.6807298088188758e-06, "loss": 1.108, "step": 12054 }, { "epoch": 0.36, "learning_rate": 3.6805148017770583e-06, "loss": 1.1607, "step": 12055 }, { "epoch": 0.36, "learning_rate": 3.680299783497308e-06, "loss": 1.1268, "step": 12056 }, { "epoch": 0.36, "learning_rate": 3.6800847539816724e-06, "loss": 1.1381, "step": 12057 }, { "epoch": 0.36, "learning_rate": 3.679869713232199e-06, "loss": 1.1655, "step": 12058 }, { "epoch": 0.36, "learning_rate": 3.6796546612509334e-06, "loss": 1.1046, "step": 12059 }, { "epoch": 0.36, "learning_rate": 3.6794395980399238e-06, "loss": 1.1613, "step": 12060 }, { "epoch": 0.36, "learning_rate": 3.6792245236012168e-06, "loss": 1.1516, "step": 12061 }, { "epoch": 0.36, "learning_rate": 3.6790094379368613e-06, "loss": 1.197, "step": 12062 }, { "epoch": 0.36, "learning_rate": 3.678794341048903e-06, "loss": 1.1991, "step": 12063 }, { "epoch": 0.36, "learning_rate": 3.6785792329393903e-06, "loss": 1.1407, "step": 12064 }, { "epoch": 0.36, "learning_rate": 3.678364113610371e-06, "loss": 1.0605, "step": 12065 }, { "epoch": 0.36, "learning_rate": 3.678148983063893e-06, "loss": 1.1219, "step": 12066 }, { "epoch": 0.36, "learning_rate": 3.6779338413020043e-06, "loss": 1.1687, "step": 12067 }, { "epoch": 0.36, "learning_rate": 3.6777186883267523e-06, "loss": 1.1726, "step": 12068 }, { "epoch": 0.36, "learning_rate": 3.6775035241401857e-06, "loss": 1.0493, "step": 12069 }, { "epoch": 0.36, "learning_rate": 3.6772883487443527e-06, "loss": 1.2999, "step": 12070 }, { "epoch": 0.36, "learning_rate": 3.677073162141302e-06, "loss": 1.1611, "step": 12071 }, { "epoch": 0.36, "learning_rate": 3.6768579643330816e-06, "loss": 1.0867, "step": 12072 }, { "epoch": 0.36, "learning_rate": 3.67664275532174e-06, "loss": 1.1658, "step": 12073 }, { "epoch": 0.36, "learning_rate": 3.676427535109326e-06, "loss": 1.2243, "step": 12074 }, { "epoch": 0.36, "learning_rate": 3.6762123036978886e-06, "loss": 1.0485, "step": 12075 }, { "epoch": 0.36, "learning_rate": 3.675997061089476e-06, "loss": 1.1244, "step": 12076 }, { "epoch": 0.36, "learning_rate": 3.6757818072861385e-06, "loss": 1.0787, "step": 12077 }, { "epoch": 0.36, "learning_rate": 3.675566542289924e-06, "loss": 1.1429, "step": 12078 }, { "epoch": 0.36, "learning_rate": 3.6753512661028823e-06, "loss": 1.1419, "step": 12079 }, { "epoch": 0.36, "learning_rate": 3.675135978727062e-06, "loss": 1.1513, "step": 12080 }, { "epoch": 0.36, "learning_rate": 3.674920680164514e-06, "loss": 1.1326, "step": 12081 }, { "epoch": 0.36, "learning_rate": 3.674705370417287e-06, "loss": 1.1227, "step": 12082 }, { "epoch": 0.36, "learning_rate": 3.67449004948743e-06, "loss": 1.1318, "step": 12083 }, { "epoch": 0.36, "learning_rate": 3.6742747173769942e-06, "loss": 1.0804, "step": 12084 }, { "epoch": 0.36, "learning_rate": 3.6740593740880282e-06, "loss": 1.1572, "step": 12085 }, { "epoch": 0.36, "learning_rate": 3.6738440196225828e-06, "loss": 1.0162, "step": 12086 }, { "epoch": 0.36, "learning_rate": 3.6736286539827072e-06, "loss": 1.2227, "step": 12087 }, { "epoch": 0.36, "learning_rate": 3.6734132771704523e-06, "loss": 1.1293, "step": 12088 }, { "epoch": 0.36, "learning_rate": 3.6731978891878678e-06, "loss": 1.1175, "step": 12089 }, { "epoch": 0.36, "learning_rate": 3.672982490037005e-06, "loss": 1.1279, "step": 12090 }, { "epoch": 0.36, "learning_rate": 3.672767079719913e-06, "loss": 1.1292, "step": 12091 }, { "epoch": 0.36, "learning_rate": 3.6725516582386435e-06, "loss": 1.1522, "step": 12092 }, { "epoch": 0.36, "learning_rate": 3.6723362255952473e-06, "loss": 1.0721, "step": 12093 }, { "epoch": 0.36, "learning_rate": 3.672120781791774e-06, "loss": 1.0703, "step": 12094 }, { "epoch": 0.36, "learning_rate": 3.671905326830277e-06, "loss": 1.0893, "step": 12095 }, { "epoch": 0.36, "learning_rate": 3.6716898607128045e-06, "loss": 1.1516, "step": 12096 }, { "epoch": 0.36, "learning_rate": 3.671474383441409e-06, "loss": 1.1382, "step": 12097 }, { "epoch": 0.36, "learning_rate": 3.6712588950181417e-06, "loss": 1.2064, "step": 12098 }, { "epoch": 0.36, "learning_rate": 3.6710433954450536e-06, "loss": 1.113, "step": 12099 }, { "epoch": 0.36, "learning_rate": 3.6708278847241962e-06, "loss": 1.2273, "step": 12100 }, { "epoch": 0.36, "learning_rate": 3.670612362857622e-06, "loss": 1.1591, "step": 12101 }, { "epoch": 0.36, "learning_rate": 3.6703968298473814e-06, "loss": 1.1731, "step": 12102 }, { "epoch": 0.36, "learning_rate": 3.670181285695527e-06, "loss": 1.1196, "step": 12103 }, { "epoch": 0.36, "learning_rate": 3.6699657304041097e-06, "loss": 1.0895, "step": 12104 }, { "epoch": 0.36, "learning_rate": 3.6697501639751824e-06, "loss": 0.9976, "step": 12105 }, { "epoch": 0.36, "learning_rate": 3.6695345864107967e-06, "loss": 1.2487, "step": 12106 }, { "epoch": 0.36, "learning_rate": 3.669318997713005e-06, "loss": 1.218, "step": 12107 }, { "epoch": 0.36, "learning_rate": 3.6691033978838603e-06, "loss": 1.0377, "step": 12108 }, { "epoch": 0.36, "learning_rate": 3.6688877869254137e-06, "loss": 1.1801, "step": 12109 }, { "epoch": 0.36, "learning_rate": 3.6686721648397188e-06, "loss": 1.19, "step": 12110 }, { "epoch": 0.36, "learning_rate": 3.668456531628827e-06, "loss": 1.1859, "step": 12111 }, { "epoch": 0.36, "learning_rate": 3.668240887294793e-06, "loss": 1.2091, "step": 12112 }, { "epoch": 0.36, "learning_rate": 3.668025231839667e-06, "loss": 1.1073, "step": 12113 }, { "epoch": 0.36, "learning_rate": 3.6678095652655043e-06, "loss": 1.0967, "step": 12114 }, { "epoch": 0.36, "learning_rate": 3.6675938875743567e-06, "loss": 1.0527, "step": 12115 }, { "epoch": 0.36, "learning_rate": 3.6673781987682777e-06, "loss": 1.0594, "step": 12116 }, { "epoch": 0.37, "learning_rate": 3.6671624988493203e-06, "loss": 1.2198, "step": 12117 }, { "epoch": 0.37, "learning_rate": 3.6669467878195374e-06, "loss": 1.2333, "step": 12118 }, { "epoch": 0.37, "learning_rate": 3.6667310656809847e-06, "loss": 0.9609, "step": 12119 }, { "epoch": 0.37, "learning_rate": 3.6665153324357126e-06, "loss": 1.1454, "step": 12120 }, { "epoch": 0.37, "learning_rate": 3.666299588085777e-06, "loss": 1.1387, "step": 12121 }, { "epoch": 0.37, "learning_rate": 3.666083832633231e-06, "loss": 1.0291, "step": 12122 }, { "epoch": 0.37, "learning_rate": 3.665868066080129e-06, "loss": 1.1153, "step": 12123 }, { "epoch": 0.37, "learning_rate": 3.6656522884285233e-06, "loss": 1.1566, "step": 12124 }, { "epoch": 0.37, "learning_rate": 3.6654364996804703e-06, "loss": 1.1962, "step": 12125 }, { "epoch": 0.37, "learning_rate": 3.6652206998380225e-06, "loss": 1.2473, "step": 12126 }, { "epoch": 0.37, "learning_rate": 3.6650048889032357e-06, "loss": 1.1757, "step": 12127 }, { "epoch": 0.37, "learning_rate": 3.6647890668781627e-06, "loss": 1.1252, "step": 12128 }, { "epoch": 0.37, "learning_rate": 3.6645732337648587e-06, "loss": 1.0787, "step": 12129 }, { "epoch": 0.37, "learning_rate": 3.6643573895653787e-06, "loss": 1.0829, "step": 12130 }, { "epoch": 0.37, "learning_rate": 3.6641415342817777e-06, "loss": 1.1339, "step": 12131 }, { "epoch": 0.37, "learning_rate": 3.663925667916109e-06, "loss": 1.1903, "step": 12132 }, { "epoch": 0.37, "learning_rate": 3.6637097904704284e-06, "loss": 1.1218, "step": 12133 }, { "epoch": 0.37, "learning_rate": 3.6634939019467914e-06, "loss": 1.2089, "step": 12134 }, { "epoch": 0.37, "learning_rate": 3.6632780023472523e-06, "loss": 1.1068, "step": 12135 }, { "epoch": 0.37, "learning_rate": 3.663062091673868e-06, "loss": 1.2476, "step": 12136 }, { "epoch": 0.37, "learning_rate": 3.662846169928692e-06, "loss": 1.1475, "step": 12137 }, { "epoch": 0.37, "learning_rate": 3.6626302371137813e-06, "loss": 1.1169, "step": 12138 }, { "epoch": 0.37, "learning_rate": 3.6624142932311895e-06, "loss": 1.1588, "step": 12139 }, { "epoch": 0.37, "learning_rate": 3.662198338282974e-06, "loss": 1.0999, "step": 12140 }, { "epoch": 0.37, "learning_rate": 3.66198237227119e-06, "loss": 1.1643, "step": 12141 }, { "epoch": 0.37, "learning_rate": 3.6617663951978944e-06, "loss": 1.3273, "step": 12142 }, { "epoch": 0.37, "learning_rate": 3.661550407065141e-06, "loss": 1.2047, "step": 12143 }, { "epoch": 0.37, "learning_rate": 3.661334407874988e-06, "loss": 1.1976, "step": 12144 }, { "epoch": 0.37, "learning_rate": 3.6611183976294896e-06, "loss": 1.0639, "step": 12145 }, { "epoch": 0.37, "learning_rate": 3.660902376330704e-06, "loss": 1.194, "step": 12146 }, { "epoch": 0.37, "learning_rate": 3.6606863439806868e-06, "loss": 1.1146, "step": 12147 }, { "epoch": 0.37, "learning_rate": 3.660470300581494e-06, "loss": 1.2438, "step": 12148 }, { "epoch": 0.37, "learning_rate": 3.660254246135184e-06, "loss": 1.1953, "step": 12149 }, { "epoch": 0.37, "learning_rate": 3.6600381806438116e-06, "loss": 1.0836, "step": 12150 }, { "epoch": 0.37, "learning_rate": 3.659822104109435e-06, "loss": 1.1903, "step": 12151 }, { "epoch": 0.37, "learning_rate": 3.65960601653411e-06, "loss": 1.1344, "step": 12152 }, { "epoch": 0.37, "learning_rate": 3.659389917919895e-06, "loss": 1.2208, "step": 12153 }, { "epoch": 0.37, "learning_rate": 3.6591738082688456e-06, "loss": 1.1858, "step": 12154 }, { "epoch": 0.37, "learning_rate": 3.6589576875830204e-06, "loss": 1.1972, "step": 12155 }, { "epoch": 0.37, "learning_rate": 3.6587415558644758e-06, "loss": 1.0131, "step": 12156 }, { "epoch": 0.37, "learning_rate": 3.6585254131152693e-06, "loss": 1.1627, "step": 12157 }, { "epoch": 0.37, "learning_rate": 3.658309259337459e-06, "loss": 1.1787, "step": 12158 }, { "epoch": 0.37, "learning_rate": 3.658093094533103e-06, "loss": 1.2565, "step": 12159 }, { "epoch": 0.37, "learning_rate": 3.657876918704258e-06, "loss": 1.1953, "step": 12160 }, { "epoch": 0.37, "learning_rate": 3.657660731852982e-06, "loss": 1.1235, "step": 12161 }, { "epoch": 0.37, "learning_rate": 3.6574445339813342e-06, "loss": 1.1614, "step": 12162 }, { "epoch": 0.37, "learning_rate": 3.6572283250913708e-06, "loss": 1.0684, "step": 12163 }, { "epoch": 0.37, "learning_rate": 3.6570121051851526e-06, "loss": 1.1456, "step": 12164 }, { "epoch": 0.37, "learning_rate": 3.6567958742647354e-06, "loss": 1.1729, "step": 12165 }, { "epoch": 0.37, "learning_rate": 3.656579632332179e-06, "loss": 1.0927, "step": 12166 }, { "epoch": 0.37, "learning_rate": 3.6563633793895416e-06, "loss": 1.1754, "step": 12167 }, { "epoch": 0.37, "learning_rate": 3.6561471154388816e-06, "loss": 1.0781, "step": 12168 }, { "epoch": 0.37, "learning_rate": 3.6559308404822574e-06, "loss": 1.2152, "step": 12169 }, { "epoch": 0.37, "learning_rate": 3.655714554521729e-06, "loss": 1.1526, "step": 12170 }, { "epoch": 0.37, "learning_rate": 3.6554982575593546e-06, "loss": 1.148, "step": 12171 }, { "epoch": 0.37, "learning_rate": 3.6552819495971926e-06, "loss": 1.1469, "step": 12172 }, { "epoch": 0.37, "learning_rate": 3.6550656306373034e-06, "loss": 1.2238, "step": 12173 }, { "epoch": 0.37, "learning_rate": 3.6548493006817453e-06, "loss": 1.135, "step": 12174 }, { "epoch": 0.37, "learning_rate": 3.6546329597325784e-06, "loss": 1.1057, "step": 12175 }, { "epoch": 0.37, "learning_rate": 3.6544166077918618e-06, "loss": 1.1359, "step": 12176 }, { "epoch": 0.37, "learning_rate": 3.6542002448616554e-06, "loss": 1.1411, "step": 12177 }, { "epoch": 0.37, "learning_rate": 3.653983870944018e-06, "loss": 1.146, "step": 12178 }, { "epoch": 0.37, "learning_rate": 3.65376748604101e-06, "loss": 1.0867, "step": 12179 }, { "epoch": 0.37, "learning_rate": 3.653551090154691e-06, "loss": 1.2731, "step": 12180 }, { "epoch": 0.37, "learning_rate": 3.653334683287122e-06, "loss": 1.1625, "step": 12181 }, { "epoch": 0.37, "learning_rate": 3.6531182654403617e-06, "loss": 1.1696, "step": 12182 }, { "epoch": 0.37, "learning_rate": 3.6529018366164715e-06, "loss": 1.0809, "step": 12183 }, { "epoch": 0.37, "learning_rate": 3.65268539681751e-06, "loss": 1.0612, "step": 12184 }, { "epoch": 0.37, "learning_rate": 3.65246894604554e-06, "loss": 1.1229, "step": 12185 }, { "epoch": 0.37, "learning_rate": 3.6522524843026196e-06, "loss": 1.2239, "step": 12186 }, { "epoch": 0.37, "learning_rate": 3.6520360115908104e-06, "loss": 1.0961, "step": 12187 }, { "epoch": 0.37, "learning_rate": 3.6518195279121737e-06, "loss": 1.0964, "step": 12188 }, { "epoch": 0.37, "learning_rate": 3.6516030332687693e-06, "loss": 1.1643, "step": 12189 }, { "epoch": 0.37, "learning_rate": 3.651386527662659e-06, "loss": 1.1407, "step": 12190 }, { "epoch": 0.37, "learning_rate": 3.6511700110959036e-06, "loss": 1.1068, "step": 12191 }, { "epoch": 0.37, "learning_rate": 3.6509534835705646e-06, "loss": 1.1124, "step": 12192 }, { "epoch": 0.37, "learning_rate": 3.650736945088702e-06, "loss": 1.2238, "step": 12193 }, { "epoch": 0.37, "learning_rate": 3.6505203956523784e-06, "loss": 1.1207, "step": 12194 }, { "epoch": 0.37, "learning_rate": 3.6503038352636543e-06, "loss": 1.22, "step": 12195 }, { "epoch": 0.37, "learning_rate": 3.650087263924592e-06, "loss": 1.2013, "step": 12196 }, { "epoch": 0.37, "learning_rate": 3.649870681637253e-06, "loss": 1.1122, "step": 12197 }, { "epoch": 0.37, "learning_rate": 3.649654088403699e-06, "loss": 1.1156, "step": 12198 }, { "epoch": 0.37, "learning_rate": 3.649437484225991e-06, "loss": 1.1447, "step": 12199 }, { "epoch": 0.37, "learning_rate": 3.649220869106192e-06, "loss": 1.0284, "step": 12200 }, { "epoch": 0.37, "learning_rate": 3.6490042430463644e-06, "loss": 1.1149, "step": 12201 }, { "epoch": 0.37, "learning_rate": 3.6487876060485687e-06, "loss": 1.1354, "step": 12202 }, { "epoch": 0.37, "learning_rate": 3.6485709581148687e-06, "loss": 1.083, "step": 12203 }, { "epoch": 0.37, "learning_rate": 3.6483542992473264e-06, "loss": 0.9887, "step": 12204 }, { "epoch": 0.37, "learning_rate": 3.6481376294480053e-06, "loss": 1.2346, "step": 12205 }, { "epoch": 0.37, "learning_rate": 3.6479209487189654e-06, "loss": 1.1793, "step": 12206 }, { "epoch": 0.37, "learning_rate": 3.647704257062272e-06, "loss": 1.1788, "step": 12207 }, { "epoch": 0.37, "learning_rate": 3.647487554479986e-06, "loss": 1.2413, "step": 12208 }, { "epoch": 0.37, "learning_rate": 3.647270840974172e-06, "loss": 1.0497, "step": 12209 }, { "epoch": 0.37, "learning_rate": 3.6470541165468913e-06, "loss": 1.1605, "step": 12210 }, { "epoch": 0.37, "learning_rate": 3.646837381200209e-06, "loss": 1.1663, "step": 12211 }, { "epoch": 0.37, "learning_rate": 3.6466206349361853e-06, "loss": 1.1798, "step": 12212 }, { "epoch": 0.37, "learning_rate": 3.6464038777568865e-06, "loss": 1.1712, "step": 12213 }, { "epoch": 0.37, "learning_rate": 3.6461871096643754e-06, "loss": 1.1076, "step": 12214 }, { "epoch": 0.37, "learning_rate": 3.645970330660714e-06, "loss": 1.0457, "step": 12215 }, { "epoch": 0.37, "learning_rate": 3.6457535407479677e-06, "loss": 1.1397, "step": 12216 }, { "epoch": 0.37, "learning_rate": 3.6455367399281987e-06, "loss": 1.1672, "step": 12217 }, { "epoch": 0.37, "learning_rate": 3.645319928203473e-06, "loss": 1.2368, "step": 12218 }, { "epoch": 0.37, "learning_rate": 3.645103105575852e-06, "loss": 1.1968, "step": 12219 }, { "epoch": 0.37, "learning_rate": 3.6448862720474014e-06, "loss": 1.0892, "step": 12220 }, { "epoch": 0.37, "learning_rate": 3.644669427620185e-06, "loss": 1.1362, "step": 12221 }, { "epoch": 0.37, "learning_rate": 3.644452572296267e-06, "loss": 1.1425, "step": 12222 }, { "epoch": 0.37, "learning_rate": 3.644235706077711e-06, "loss": 1.1555, "step": 12223 }, { "epoch": 0.37, "learning_rate": 3.6440188289665835e-06, "loss": 1.184, "step": 12224 }, { "epoch": 0.37, "learning_rate": 3.6438019409649463e-06, "loss": 1.1549, "step": 12225 }, { "epoch": 0.37, "learning_rate": 3.6435850420748657e-06, "loss": 1.0859, "step": 12226 }, { "epoch": 0.37, "learning_rate": 3.6433681322984073e-06, "loss": 1.114, "step": 12227 }, { "epoch": 0.37, "learning_rate": 3.643151211637634e-06, "loss": 1.2493, "step": 12228 }, { "epoch": 0.37, "learning_rate": 3.6429342800946116e-06, "loss": 1.1893, "step": 12229 }, { "epoch": 0.37, "learning_rate": 3.6427173376714053e-06, "loss": 1.1926, "step": 12230 }, { "epoch": 0.37, "learning_rate": 3.6425003843700814e-06, "loss": 1.19, "step": 12231 }, { "epoch": 0.37, "learning_rate": 3.6422834201927032e-06, "loss": 1.0647, "step": 12232 }, { "epoch": 0.37, "learning_rate": 3.642066445141337e-06, "loss": 1.2833, "step": 12233 }, { "epoch": 0.37, "learning_rate": 3.6418494592180487e-06, "loss": 1.0999, "step": 12234 }, { "epoch": 0.37, "learning_rate": 3.6416324624249033e-06, "loss": 1.2614, "step": 12235 }, { "epoch": 0.37, "learning_rate": 3.641415454763967e-06, "loss": 1.0389, "step": 12236 }, { "epoch": 0.37, "learning_rate": 3.641198436237305e-06, "loss": 1.198, "step": 12237 }, { "epoch": 0.37, "learning_rate": 3.640981406846983e-06, "loss": 1.2281, "step": 12238 }, { "epoch": 0.37, "learning_rate": 3.640764366595068e-06, "loss": 1.1489, "step": 12239 }, { "epoch": 0.37, "learning_rate": 3.6405473154836257e-06, "loss": 1.1187, "step": 12240 }, { "epoch": 0.37, "learning_rate": 3.640330253514722e-06, "loss": 1.0682, "step": 12241 }, { "epoch": 0.37, "learning_rate": 3.6401131806904234e-06, "loss": 1.2128, "step": 12242 }, { "epoch": 0.37, "learning_rate": 3.639896097012797e-06, "loss": 1.21, "step": 12243 }, { "epoch": 0.37, "learning_rate": 3.6396790024839077e-06, "loss": 1.1714, "step": 12244 }, { "epoch": 0.37, "learning_rate": 3.6394618971058243e-06, "loss": 1.1255, "step": 12245 }, { "epoch": 0.37, "learning_rate": 3.639244780880612e-06, "loss": 1.1263, "step": 12246 }, { "epoch": 0.37, "learning_rate": 3.6390276538103383e-06, "loss": 1.1681, "step": 12247 }, { "epoch": 0.37, "learning_rate": 3.63881051589707e-06, "loss": 1.1916, "step": 12248 }, { "epoch": 0.37, "learning_rate": 3.6385933671428732e-06, "loss": 1.1273, "step": 12249 }, { "epoch": 0.37, "learning_rate": 3.638376207549817e-06, "loss": 1.1255, "step": 12250 }, { "epoch": 0.37, "learning_rate": 3.6381590371199667e-06, "loss": 1.0791, "step": 12251 }, { "epoch": 0.37, "learning_rate": 3.637941855855391e-06, "loss": 1.1346, "step": 12252 }, { "epoch": 0.37, "learning_rate": 3.6377246637581564e-06, "loss": 0.9947, "step": 12253 }, { "epoch": 0.37, "learning_rate": 3.6375074608303314e-06, "loss": 1.1168, "step": 12254 }, { "epoch": 0.37, "learning_rate": 3.6372902470739834e-06, "loss": 1.2406, "step": 12255 }, { "epoch": 0.37, "learning_rate": 3.6370730224911792e-06, "loss": 1.1238, "step": 12256 }, { "epoch": 0.37, "learning_rate": 3.636855787083988e-06, "loss": 1.0399, "step": 12257 }, { "epoch": 0.37, "learning_rate": 3.6366385408544768e-06, "loss": 1.0781, "step": 12258 }, { "epoch": 0.37, "learning_rate": 3.6364212838047154e-06, "loss": 1.0507, "step": 12259 }, { "epoch": 0.37, "learning_rate": 3.636204015936769e-06, "loss": 1.1289, "step": 12260 }, { "epoch": 0.37, "learning_rate": 3.635986737252709e-06, "loss": 1.1435, "step": 12261 }, { "epoch": 0.37, "learning_rate": 3.635769447754601e-06, "loss": 1.1508, "step": 12262 }, { "epoch": 0.37, "learning_rate": 3.6355521474445167e-06, "loss": 1.1956, "step": 12263 }, { "epoch": 0.37, "learning_rate": 3.635334836324521e-06, "loss": 1.2203, "step": 12264 }, { "epoch": 0.37, "learning_rate": 3.6351175143966854e-06, "loss": 1.209, "step": 12265 }, { "epoch": 0.37, "learning_rate": 3.6349001816630776e-06, "loss": 1.1381, "step": 12266 }, { "epoch": 0.37, "learning_rate": 3.6346828381257665e-06, "loss": 1.0688, "step": 12267 }, { "epoch": 0.37, "learning_rate": 3.6344654837868215e-06, "loss": 1.2382, "step": 12268 }, { "epoch": 0.37, "learning_rate": 3.6342481186483115e-06, "loss": 1.1426, "step": 12269 }, { "epoch": 0.37, "learning_rate": 3.634030742712305e-06, "loss": 1.2439, "step": 12270 }, { "epoch": 0.37, "learning_rate": 3.6338133559808723e-06, "loss": 1.0554, "step": 12271 }, { "epoch": 0.37, "learning_rate": 3.633595958456083e-06, "loss": 1.0665, "step": 12272 }, { "epoch": 0.37, "learning_rate": 3.6333785501400058e-06, "loss": 1.1827, "step": 12273 }, { "epoch": 0.37, "learning_rate": 3.6331611310347113e-06, "loss": 1.1652, "step": 12274 }, { "epoch": 0.37, "learning_rate": 3.6329437011422677e-06, "loss": 1.0258, "step": 12275 }, { "epoch": 0.37, "learning_rate": 3.632726260464746e-06, "loss": 1.1655, "step": 12276 }, { "epoch": 0.37, "learning_rate": 3.632508809004216e-06, "loss": 1.0211, "step": 12277 }, { "epoch": 0.37, "learning_rate": 3.632291346762748e-06, "loss": 1.1124, "step": 12278 }, { "epoch": 0.37, "learning_rate": 3.632073873742411e-06, "loss": 1.0954, "step": 12279 }, { "epoch": 0.37, "learning_rate": 3.6318563899452756e-06, "loss": 1.1771, "step": 12280 }, { "epoch": 0.37, "learning_rate": 3.6316388953734135e-06, "loss": 1.1286, "step": 12281 }, { "epoch": 0.37, "learning_rate": 3.631421390028893e-06, "loss": 1.1547, "step": 12282 }, { "epoch": 0.37, "learning_rate": 3.631203873913787e-06, "loss": 1.0486, "step": 12283 }, { "epoch": 0.37, "learning_rate": 3.6309863470301643e-06, "loss": 1.1062, "step": 12284 }, { "epoch": 0.37, "learning_rate": 3.6307688093800957e-06, "loss": 1.0222, "step": 12285 }, { "epoch": 0.37, "learning_rate": 3.6305512609656534e-06, "loss": 1.0738, "step": 12286 }, { "epoch": 0.37, "learning_rate": 3.6303337017889074e-06, "loss": 1.1357, "step": 12287 }, { "epoch": 0.37, "learning_rate": 3.630116131851929e-06, "loss": 1.0372, "step": 12288 }, { "epoch": 0.37, "learning_rate": 3.6298985511567897e-06, "loss": 1.1125, "step": 12289 }, { "epoch": 0.37, "learning_rate": 3.629680959705559e-06, "loss": 1.0859, "step": 12290 }, { "epoch": 0.37, "learning_rate": 3.629463357500311e-06, "loss": 1.0981, "step": 12291 }, { "epoch": 0.37, "learning_rate": 3.6292457445431157e-06, "loss": 1.0484, "step": 12292 }, { "epoch": 0.37, "learning_rate": 3.6290281208360446e-06, "loss": 1.1016, "step": 12293 }, { "epoch": 0.37, "learning_rate": 3.6288104863811695e-06, "loss": 1.0958, "step": 12294 }, { "epoch": 0.37, "learning_rate": 3.6285928411805616e-06, "loss": 1.0773, "step": 12295 }, { "epoch": 0.37, "learning_rate": 3.6283751852362946e-06, "loss": 1.2026, "step": 12296 }, { "epoch": 0.37, "learning_rate": 3.628157518550438e-06, "loss": 1.1691, "step": 12297 }, { "epoch": 0.37, "learning_rate": 3.627939841125066e-06, "loss": 1.1084, "step": 12298 }, { "epoch": 0.37, "learning_rate": 3.6277221529622497e-06, "loss": 1.2235, "step": 12299 }, { "epoch": 0.37, "learning_rate": 3.627504454064062e-06, "loss": 1.2161, "step": 12300 }, { "epoch": 0.37, "learning_rate": 3.6272867444325744e-06, "loss": 1.1578, "step": 12301 }, { "epoch": 0.37, "learning_rate": 3.62706902406986e-06, "loss": 1.177, "step": 12302 }, { "epoch": 0.37, "learning_rate": 3.6268512929779913e-06, "loss": 1.0402, "step": 12303 }, { "epoch": 0.37, "learning_rate": 3.626633551159041e-06, "loss": 1.2166, "step": 12304 }, { "epoch": 0.37, "learning_rate": 3.6264157986150823e-06, "loss": 1.1365, "step": 12305 }, { "epoch": 0.37, "learning_rate": 3.6261980353481876e-06, "loss": 1.2209, "step": 12306 }, { "epoch": 0.37, "learning_rate": 3.62598026136043e-06, "loss": 1.0623, "step": 12307 }, { "epoch": 0.37, "learning_rate": 3.625762476653882e-06, "loss": 1.0901, "step": 12308 }, { "epoch": 0.37, "learning_rate": 3.6255446812306183e-06, "loss": 1.1322, "step": 12309 }, { "epoch": 0.37, "learning_rate": 3.6253268750927107e-06, "loss": 1.1544, "step": 12310 }, { "epoch": 0.37, "learning_rate": 3.6251090582422326e-06, "loss": 1.1238, "step": 12311 }, { "epoch": 0.37, "learning_rate": 3.624891230681259e-06, "loss": 1.1094, "step": 12312 }, { "epoch": 0.37, "learning_rate": 3.624673392411863e-06, "loss": 1.14, "step": 12313 }, { "epoch": 0.37, "learning_rate": 3.6244555434361173e-06, "loss": 1.0953, "step": 12314 }, { "epoch": 0.37, "learning_rate": 3.6242376837560967e-06, "loss": 1.0691, "step": 12315 }, { "epoch": 0.37, "learning_rate": 3.6240198133738746e-06, "loss": 1.1116, "step": 12316 }, { "epoch": 0.37, "learning_rate": 3.623801932291525e-06, "loss": 1.2587, "step": 12317 }, { "epoch": 0.37, "learning_rate": 3.6235840405111226e-06, "loss": 1.2123, "step": 12318 }, { "epoch": 0.37, "learning_rate": 3.623366138034741e-06, "loss": 1.1716, "step": 12319 }, { "epoch": 0.37, "learning_rate": 3.6231482248644557e-06, "loss": 1.1, "step": 12320 }, { "epoch": 0.37, "learning_rate": 3.6229303010023393e-06, "loss": 1.0953, "step": 12321 }, { "epoch": 0.37, "learning_rate": 3.6227123664504676e-06, "loss": 1.1802, "step": 12322 }, { "epoch": 0.37, "learning_rate": 3.6224944212109146e-06, "loss": 1.1478, "step": 12323 }, { "epoch": 0.37, "learning_rate": 3.6222764652857556e-06, "loss": 1.0317, "step": 12324 }, { "epoch": 0.37, "learning_rate": 3.6220584986770652e-06, "loss": 1.188, "step": 12325 }, { "epoch": 0.37, "learning_rate": 3.621840521386918e-06, "loss": 1.1674, "step": 12326 }, { "epoch": 0.37, "learning_rate": 3.6216225334173895e-06, "loss": 1.0129, "step": 12327 }, { "epoch": 0.37, "learning_rate": 3.621404534770555e-06, "loss": 1.1494, "step": 12328 }, { "epoch": 0.37, "learning_rate": 3.621186525448489e-06, "loss": 1.1321, "step": 12329 }, { "epoch": 0.37, "learning_rate": 3.6209685054532674e-06, "loss": 1.2148, "step": 12330 }, { "epoch": 0.37, "learning_rate": 3.6207504747869654e-06, "loss": 1.3036, "step": 12331 }, { "epoch": 0.37, "learning_rate": 3.6205324334516584e-06, "loss": 1.0821, "step": 12332 }, { "epoch": 0.37, "learning_rate": 3.620314381449423e-06, "loss": 1.08, "step": 12333 }, { "epoch": 0.37, "learning_rate": 3.6200963187823335e-06, "loss": 1.0784, "step": 12334 }, { "epoch": 0.37, "learning_rate": 3.6198782454524672e-06, "loss": 1.1465, "step": 12335 }, { "epoch": 0.37, "learning_rate": 3.6196601614618986e-06, "loss": 1.1937, "step": 12336 }, { "epoch": 0.37, "learning_rate": 3.6194420668127056e-06, "loss": 1.2167, "step": 12337 }, { "epoch": 0.37, "learning_rate": 3.6192239615069623e-06, "loss": 1.0833, "step": 12338 }, { "epoch": 0.37, "learning_rate": 3.6190058455467457e-06, "loss": 1.181, "step": 12339 }, { "epoch": 0.37, "learning_rate": 3.618787718934133e-06, "loss": 1.1902, "step": 12340 }, { "epoch": 0.37, "learning_rate": 3.6185695816712004e-06, "loss": 1.089, "step": 12341 }, { "epoch": 0.37, "learning_rate": 3.6183514337600235e-06, "loss": 1.1046, "step": 12342 }, { "epoch": 0.37, "learning_rate": 3.61813327520268e-06, "loss": 1.1824, "step": 12343 }, { "epoch": 0.37, "learning_rate": 3.6179151060012456e-06, "loss": 1.1183, "step": 12344 }, { "epoch": 0.37, "learning_rate": 3.6176969261577978e-06, "loss": 1.1425, "step": 12345 }, { "epoch": 0.37, "learning_rate": 3.6174787356744145e-06, "loss": 1.1496, "step": 12346 }, { "epoch": 0.37, "learning_rate": 3.617260534553171e-06, "loss": 1.1011, "step": 12347 }, { "epoch": 0.37, "learning_rate": 3.617042322796146e-06, "loss": 1.0813, "step": 12348 }, { "epoch": 0.37, "learning_rate": 3.616824100405415e-06, "loss": 1.1428, "step": 12349 }, { "epoch": 0.37, "learning_rate": 3.616605867383057e-06, "loss": 1.1527, "step": 12350 }, { "epoch": 0.37, "learning_rate": 3.616387623731149e-06, "loss": 1.0539, "step": 12351 }, { "epoch": 0.37, "learning_rate": 3.6161693694517684e-06, "loss": 1.097, "step": 12352 }, { "epoch": 0.37, "learning_rate": 3.615951104546993e-06, "loss": 1.0858, "step": 12353 }, { "epoch": 0.37, "learning_rate": 3.615732829018901e-06, "loss": 1.0938, "step": 12354 }, { "epoch": 0.37, "learning_rate": 3.615514542869569e-06, "loss": 1.1398, "step": 12355 }, { "epoch": 0.37, "learning_rate": 3.6152962461010765e-06, "loss": 1.0455, "step": 12356 }, { "epoch": 0.37, "learning_rate": 3.6150779387155003e-06, "loss": 1.1075, "step": 12357 }, { "epoch": 0.37, "learning_rate": 3.61485962071492e-06, "loss": 1.1603, "step": 12358 }, { "epoch": 0.37, "learning_rate": 3.6146412921014122e-06, "loss": 1.1244, "step": 12359 }, { "epoch": 0.37, "learning_rate": 3.6144229528770564e-06, "loss": 1.177, "step": 12360 }, { "epoch": 0.37, "learning_rate": 3.614204603043931e-06, "loss": 1.1126, "step": 12361 }, { "epoch": 0.37, "learning_rate": 3.613986242604114e-06, "loss": 1.2108, "step": 12362 }, { "epoch": 0.37, "learning_rate": 3.613767871559685e-06, "loss": 1.2134, "step": 12363 }, { "epoch": 0.37, "learning_rate": 3.613549489912722e-06, "loss": 1.1245, "step": 12364 }, { "epoch": 0.37, "learning_rate": 3.613331097665304e-06, "loss": 1.0144, "step": 12365 }, { "epoch": 0.37, "learning_rate": 3.6131126948195106e-06, "loss": 1.0989, "step": 12366 }, { "epoch": 0.37, "learning_rate": 3.6128942813774197e-06, "loss": 1.3331, "step": 12367 }, { "epoch": 0.37, "learning_rate": 3.6126758573411117e-06, "loss": 1.1478, "step": 12368 }, { "epoch": 0.37, "learning_rate": 3.6124574227126656e-06, "loss": 1.2028, "step": 12369 }, { "epoch": 0.37, "learning_rate": 3.61223897749416e-06, "loss": 1.1877, "step": 12370 }, { "epoch": 0.37, "learning_rate": 3.6120205216876757e-06, "loss": 1.1725, "step": 12371 }, { "epoch": 0.37, "learning_rate": 3.6118020552952916e-06, "loss": 1.1371, "step": 12372 }, { "epoch": 0.37, "learning_rate": 3.611583578319087e-06, "loss": 1.1051, "step": 12373 }, { "epoch": 0.37, "learning_rate": 3.6113650907611426e-06, "loss": 1.1483, "step": 12374 }, { "epoch": 0.37, "learning_rate": 3.6111465926235366e-06, "loss": 1.1085, "step": 12375 }, { "epoch": 0.37, "learning_rate": 3.6109280839083517e-06, "loss": 1.0294, "step": 12376 }, { "epoch": 0.37, "learning_rate": 3.6107095646176653e-06, "loss": 1.0939, "step": 12377 }, { "epoch": 0.37, "learning_rate": 3.6104910347535598e-06, "loss": 1.0613, "step": 12378 }, { "epoch": 0.37, "learning_rate": 3.6102724943181133e-06, "loss": 1.1254, "step": 12379 }, { "epoch": 0.37, "learning_rate": 3.610053943313408e-06, "loss": 1.1762, "step": 12380 }, { "epoch": 0.37, "learning_rate": 3.6098353817415236e-06, "loss": 1.1996, "step": 12381 }, { "epoch": 0.37, "learning_rate": 3.6096168096045414e-06, "loss": 1.0309, "step": 12382 }, { "epoch": 0.37, "learning_rate": 3.6093982269045412e-06, "loss": 1.1242, "step": 12383 }, { "epoch": 0.37, "learning_rate": 3.6091796336436047e-06, "loss": 1.1802, "step": 12384 }, { "epoch": 0.37, "learning_rate": 3.6089610298238116e-06, "loss": 1.1758, "step": 12385 }, { "epoch": 0.37, "learning_rate": 3.6087424154472432e-06, "loss": 1.1704, "step": 12386 }, { "epoch": 0.37, "learning_rate": 3.608523790515982e-06, "loss": 1.2847, "step": 12387 }, { "epoch": 0.37, "learning_rate": 3.608305155032108e-06, "loss": 1.1306, "step": 12388 }, { "epoch": 0.37, "learning_rate": 3.6080865089977023e-06, "loss": 1.1157, "step": 12389 }, { "epoch": 0.37, "learning_rate": 3.6078678524148467e-06, "loss": 1.1677, "step": 12390 }, { "epoch": 0.37, "learning_rate": 3.6076491852856233e-06, "loss": 1.0076, "step": 12391 }, { "epoch": 0.37, "learning_rate": 3.607430507612113e-06, "loss": 1.2226, "step": 12392 }, { "epoch": 0.37, "learning_rate": 3.6072118193963968e-06, "loss": 1.1808, "step": 12393 }, { "epoch": 0.37, "learning_rate": 3.606993120640558e-06, "loss": 1.0797, "step": 12394 }, { "epoch": 0.37, "learning_rate": 3.606774411346678e-06, "loss": 1.1646, "step": 12395 }, { "epoch": 0.37, "learning_rate": 3.606555691516838e-06, "loss": 1.1723, "step": 12396 }, { "epoch": 0.37, "learning_rate": 3.6063369611531213e-06, "loss": 1.087, "step": 12397 }, { "epoch": 0.37, "learning_rate": 3.6061182202576095e-06, "loss": 1.1599, "step": 12398 }, { "epoch": 0.37, "learning_rate": 3.6058994688323846e-06, "loss": 1.1031, "step": 12399 }, { "epoch": 0.37, "learning_rate": 3.6056807068795295e-06, "loss": 1.1719, "step": 12400 }, { "epoch": 0.37, "learning_rate": 3.6054619344011267e-06, "loss": 1.1252, "step": 12401 }, { "epoch": 0.37, "learning_rate": 3.6052431513992593e-06, "loss": 1.2201, "step": 12402 }, { "epoch": 0.37, "learning_rate": 3.6050243578760086e-06, "loss": 1.1695, "step": 12403 }, { "epoch": 0.37, "learning_rate": 3.6048055538334587e-06, "loss": 1.1024, "step": 12404 }, { "epoch": 0.37, "learning_rate": 3.6045867392736916e-06, "loss": 1.0978, "step": 12405 }, { "epoch": 0.37, "learning_rate": 3.604367914198791e-06, "loss": 1.1492, "step": 12406 }, { "epoch": 0.37, "learning_rate": 3.60414907861084e-06, "loss": 1.1241, "step": 12407 }, { "epoch": 0.37, "learning_rate": 3.6039302325119208e-06, "loss": 1.0602, "step": 12408 }, { "epoch": 0.37, "learning_rate": 3.6037113759041177e-06, "loss": 1.0582, "step": 12409 }, { "epoch": 0.37, "learning_rate": 3.603492508789514e-06, "loss": 1.2258, "step": 12410 }, { "epoch": 0.37, "learning_rate": 3.6032736311701927e-06, "loss": 1.1405, "step": 12411 }, { "epoch": 0.37, "learning_rate": 3.603054743048238e-06, "loss": 0.9793, "step": 12412 }, { "epoch": 0.37, "learning_rate": 3.602835844425734e-06, "loss": 1.0823, "step": 12413 }, { "epoch": 0.37, "learning_rate": 3.602616935304763e-06, "loss": 1.1096, "step": 12414 }, { "epoch": 0.37, "learning_rate": 3.6023980156874106e-06, "loss": 1.0665, "step": 12415 }, { "epoch": 0.37, "learning_rate": 3.6021790855757595e-06, "loss": 1.1306, "step": 12416 }, { "epoch": 0.37, "learning_rate": 3.6019601449718948e-06, "loss": 1.1257, "step": 12417 }, { "epoch": 0.37, "learning_rate": 3.6017411938779e-06, "loss": 1.1445, "step": 12418 }, { "epoch": 0.37, "learning_rate": 3.60152223229586e-06, "loss": 1.0715, "step": 12419 }, { "epoch": 0.37, "learning_rate": 3.601303260227858e-06, "loss": 1.1312, "step": 12420 }, { "epoch": 0.37, "learning_rate": 3.6010842776759795e-06, "loss": 1.0476, "step": 12421 }, { "epoch": 0.37, "learning_rate": 3.6008652846423093e-06, "loss": 1.1331, "step": 12422 }, { "epoch": 0.37, "learning_rate": 3.6006462811289323e-06, "loss": 1.1312, "step": 12423 }, { "epoch": 0.37, "learning_rate": 3.600427267137932e-06, "loss": 1.1854, "step": 12424 }, { "epoch": 0.37, "learning_rate": 3.600208242671394e-06, "loss": 1.1505, "step": 12425 }, { "epoch": 0.37, "learning_rate": 3.5999892077314042e-06, "loss": 1.1487, "step": 12426 }, { "epoch": 0.37, "learning_rate": 3.5997701623200465e-06, "loss": 1.1946, "step": 12427 }, { "epoch": 0.37, "learning_rate": 3.599551106439407e-06, "loss": 1.0819, "step": 12428 }, { "epoch": 0.37, "learning_rate": 3.5993320400915695e-06, "loss": 1.1003, "step": 12429 }, { "epoch": 0.37, "learning_rate": 3.5991129632786214e-06, "loss": 1.1302, "step": 12430 }, { "epoch": 0.37, "learning_rate": 3.5988938760026463e-06, "loss": 1.2175, "step": 12431 }, { "epoch": 0.37, "learning_rate": 3.5986747782657317e-06, "loss": 1.2223, "step": 12432 }, { "epoch": 0.37, "learning_rate": 3.598455670069962e-06, "loss": 1.1357, "step": 12433 }, { "epoch": 0.37, "learning_rate": 3.598236551417423e-06, "loss": 1.0928, "step": 12434 }, { "epoch": 0.37, "learning_rate": 3.598017422310201e-06, "loss": 1.1297, "step": 12435 }, { "epoch": 0.37, "learning_rate": 3.5977982827503827e-06, "loss": 1.2681, "step": 12436 }, { "epoch": 0.37, "learning_rate": 3.597579132740053e-06, "loss": 1.0499, "step": 12437 }, { "epoch": 0.37, "learning_rate": 3.597359972281298e-06, "loss": 1.2749, "step": 12438 }, { "epoch": 0.37, "learning_rate": 3.5971408013762054e-06, "loss": 1.287, "step": 12439 }, { "epoch": 0.37, "learning_rate": 3.59692162002686e-06, "loss": 1.1264, "step": 12440 }, { "epoch": 0.37, "learning_rate": 3.5967024282353504e-06, "loss": 1.1444, "step": 12441 }, { "epoch": 0.37, "learning_rate": 3.596483226003761e-06, "loss": 1.0738, "step": 12442 }, { "epoch": 0.37, "learning_rate": 3.59626401333418e-06, "loss": 1.3298, "step": 12443 }, { "epoch": 0.37, "learning_rate": 3.596044790228692e-06, "loss": 1.1602, "step": 12444 }, { "epoch": 0.37, "learning_rate": 3.595825556689387e-06, "loss": 1.1285, "step": 12445 }, { "epoch": 0.37, "learning_rate": 3.5956063127183495e-06, "loss": 1.1315, "step": 12446 }, { "epoch": 0.37, "learning_rate": 3.595387058317668e-06, "loss": 1.0502, "step": 12447 }, { "epoch": 0.37, "learning_rate": 3.59516779348943e-06, "loss": 1.1444, "step": 12448 }, { "epoch": 0.38, "learning_rate": 3.594948518235721e-06, "loss": 1.1342, "step": 12449 }, { "epoch": 0.38, "learning_rate": 3.594729232558629e-06, "loss": 1.1294, "step": 12450 }, { "epoch": 0.38, "learning_rate": 3.594509936460243e-06, "loss": 1.1654, "step": 12451 }, { "epoch": 0.38, "learning_rate": 3.5942906299426492e-06, "loss": 1.178, "step": 12452 }, { "epoch": 0.38, "learning_rate": 3.594071313007936e-06, "loss": 1.0925, "step": 12453 }, { "epoch": 0.38, "learning_rate": 3.5938519856581906e-06, "loss": 1.0681, "step": 12454 }, { "epoch": 0.38, "learning_rate": 3.5936326478955007e-06, "loss": 1.2289, "step": 12455 }, { "epoch": 0.38, "learning_rate": 3.5934132997219552e-06, "loss": 1.1204, "step": 12456 }, { "epoch": 0.38, "learning_rate": 3.593193941139641e-06, "loss": 1.025, "step": 12457 }, { "epoch": 0.38, "learning_rate": 3.592974572150648e-06, "loss": 1.1111, "step": 12458 }, { "epoch": 0.38, "learning_rate": 3.592755192757063e-06, "loss": 1.1743, "step": 12459 }, { "epoch": 0.38, "learning_rate": 3.5925358029609745e-06, "loss": 1.1562, "step": 12460 }, { "epoch": 0.38, "learning_rate": 3.592316402764472e-06, "loss": 1.1683, "step": 12461 }, { "epoch": 0.38, "learning_rate": 3.592096992169643e-06, "loss": 1.2518, "step": 12462 }, { "epoch": 0.38, "learning_rate": 3.5918775711785765e-06, "loss": 1.2887, "step": 12463 }, { "epoch": 0.38, "learning_rate": 3.5916581397933613e-06, "loss": 1.1059, "step": 12464 }, { "epoch": 0.38, "learning_rate": 3.591438698016087e-06, "loss": 1.1776, "step": 12465 }, { "epoch": 0.38, "learning_rate": 3.5912192458488416e-06, "loss": 1.0381, "step": 12466 }, { "epoch": 0.38, "learning_rate": 3.5909997832937144e-06, "loss": 1.1527, "step": 12467 }, { "epoch": 0.38, "learning_rate": 3.590780310352795e-06, "loss": 1.0754, "step": 12468 }, { "epoch": 0.38, "learning_rate": 3.590560827028172e-06, "loss": 1.1879, "step": 12469 }, { "epoch": 0.38, "learning_rate": 3.5903413333219357e-06, "loss": 1.1945, "step": 12470 }, { "epoch": 0.38, "learning_rate": 3.5901218292361744e-06, "loss": 1.0941, "step": 12471 }, { "epoch": 0.38, "learning_rate": 3.5899023147729784e-06, "loss": 1.0605, "step": 12472 }, { "epoch": 0.38, "learning_rate": 3.5896827899344377e-06, "loss": 1.1901, "step": 12473 }, { "epoch": 0.38, "learning_rate": 3.5894632547226415e-06, "loss": 1.0938, "step": 12474 }, { "epoch": 0.38, "learning_rate": 3.58924370913968e-06, "loss": 1.1437, "step": 12475 }, { "epoch": 0.38, "learning_rate": 3.5890241531876425e-06, "loss": 1.1064, "step": 12476 }, { "epoch": 0.38, "learning_rate": 3.58880458686862e-06, "loss": 1.2241, "step": 12477 }, { "epoch": 0.38, "learning_rate": 3.5885850101847018e-06, "loss": 1.1407, "step": 12478 }, { "epoch": 0.38, "learning_rate": 3.588365423137978e-06, "loss": 1.1085, "step": 12479 }, { "epoch": 0.38, "learning_rate": 3.5881458257305415e-06, "loss": 1.194, "step": 12480 }, { "epoch": 0.38, "learning_rate": 3.5879262179644793e-06, "loss": 1.1242, "step": 12481 }, { "epoch": 0.38, "learning_rate": 3.5877065998418837e-06, "loss": 1.0776, "step": 12482 }, { "epoch": 0.38, "learning_rate": 3.5874869713648453e-06, "loss": 1.0767, "step": 12483 }, { "epoch": 0.38, "learning_rate": 3.5872673325354544e-06, "loss": 1.0839, "step": 12484 }, { "epoch": 0.38, "learning_rate": 3.5870476833558025e-06, "loss": 1.187, "step": 12485 }, { "epoch": 0.38, "learning_rate": 3.586828023827981e-06, "loss": 1.1154, "step": 12486 }, { "epoch": 0.38, "learning_rate": 3.5866083539540787e-06, "loss": 1.1383, "step": 12487 }, { "epoch": 0.38, "learning_rate": 3.5863886737361885e-06, "loss": 1.1581, "step": 12488 }, { "epoch": 0.38, "learning_rate": 3.5861689831764017e-06, "loss": 1.2209, "step": 12489 }, { "epoch": 0.38, "learning_rate": 3.5859492822768088e-06, "loss": 1.057, "step": 12490 }, { "epoch": 0.38, "learning_rate": 3.5857295710395023e-06, "loss": 1.0992, "step": 12491 }, { "epoch": 0.38, "learning_rate": 3.5855098494665723e-06, "loss": 1.2119, "step": 12492 }, { "epoch": 0.38, "learning_rate": 3.5852901175601122e-06, "loss": 1.1857, "step": 12493 }, { "epoch": 0.38, "learning_rate": 3.5850703753222126e-06, "loss": 0.991, "step": 12494 }, { "epoch": 0.38, "learning_rate": 3.5848506227549664e-06, "loss": 1.1619, "step": 12495 }, { "epoch": 0.38, "learning_rate": 3.584630859860464e-06, "loss": 1.0284, "step": 12496 }, { "epoch": 0.38, "learning_rate": 3.5844110866407983e-06, "loss": 0.9839, "step": 12497 }, { "epoch": 0.38, "learning_rate": 3.5841913030980612e-06, "loss": 1.175, "step": 12498 }, { "epoch": 0.38, "learning_rate": 3.5839715092343454e-06, "loss": 1.0822, "step": 12499 }, { "epoch": 0.38, "learning_rate": 3.583751705051742e-06, "loss": 1.248, "step": 12500 }, { "epoch": 0.38, "learning_rate": 3.5835318905523455e-06, "loss": 1.1545, "step": 12501 }, { "epoch": 0.38, "learning_rate": 3.583312065738247e-06, "loss": 1.1305, "step": 12502 }, { "epoch": 0.38, "learning_rate": 3.5830922306115383e-06, "loss": 1.1902, "step": 12503 }, { "epoch": 0.38, "learning_rate": 3.582872385174314e-06, "loss": 1.1645, "step": 12504 }, { "epoch": 0.38, "learning_rate": 3.5826525294286657e-06, "loss": 1.0501, "step": 12505 }, { "epoch": 0.38, "learning_rate": 3.5824326633766876e-06, "loss": 1.0857, "step": 12506 }, { "epoch": 0.38, "learning_rate": 3.5822127870204716e-06, "loss": 1.1683, "step": 12507 }, { "epoch": 0.38, "learning_rate": 3.5819929003621107e-06, "loss": 1.1528, "step": 12508 }, { "epoch": 0.38, "learning_rate": 3.5817730034036986e-06, "loss": 1.0998, "step": 12509 }, { "epoch": 0.38, "learning_rate": 3.581553096147329e-06, "loss": 1.0237, "step": 12510 }, { "epoch": 0.38, "learning_rate": 3.5813331785950938e-06, "loss": 1.1207, "step": 12511 }, { "epoch": 0.38, "learning_rate": 3.5811132507490887e-06, "loss": 1.1367, "step": 12512 }, { "epoch": 0.38, "learning_rate": 3.5808933126114055e-06, "loss": 1.0913, "step": 12513 }, { "epoch": 0.38, "learning_rate": 3.5806733641841384e-06, "loss": 1.1518, "step": 12514 }, { "epoch": 0.38, "learning_rate": 3.5804534054693817e-06, "loss": 1.0828, "step": 12515 }, { "epoch": 0.38, "learning_rate": 3.5802334364692285e-06, "loss": 1.1261, "step": 12516 }, { "epoch": 0.38, "learning_rate": 3.580013457185774e-06, "loss": 1.2501, "step": 12517 }, { "epoch": 0.38, "learning_rate": 3.5797934676211103e-06, "loss": 1.219, "step": 12518 }, { "epoch": 0.38, "learning_rate": 3.579573467777334e-06, "loss": 1.1533, "step": 12519 }, { "epoch": 0.38, "learning_rate": 3.5793534576565374e-06, "loss": 1.1279, "step": 12520 }, { "epoch": 0.38, "learning_rate": 3.5791334372608165e-06, "loss": 1.1718, "step": 12521 }, { "epoch": 0.38, "learning_rate": 3.578913406592265e-06, "loss": 1.1394, "step": 12522 }, { "epoch": 0.38, "learning_rate": 3.578693365652977e-06, "loss": 1.1697, "step": 12523 }, { "epoch": 0.38, "learning_rate": 3.5784733144450477e-06, "loss": 1.1714, "step": 12524 }, { "epoch": 0.38, "learning_rate": 3.5782532529705722e-06, "loss": 1.2118, "step": 12525 }, { "epoch": 0.38, "learning_rate": 3.5780331812316447e-06, "loss": 1.1973, "step": 12526 }, { "epoch": 0.38, "learning_rate": 3.5778130992303612e-06, "loss": 1.1554, "step": 12527 }, { "epoch": 0.38, "learning_rate": 3.577593006968815e-06, "loss": 1.0536, "step": 12528 }, { "epoch": 0.38, "learning_rate": 3.577372904449103e-06, "loss": 1.1342, "step": 12529 }, { "epoch": 0.38, "learning_rate": 3.5771527916733194e-06, "loss": 1.1568, "step": 12530 }, { "epoch": 0.38, "learning_rate": 3.5769326686435607e-06, "loss": 1.1064, "step": 12531 }, { "epoch": 0.38, "learning_rate": 3.576712535361921e-06, "loss": 1.1357, "step": 12532 }, { "epoch": 0.38, "learning_rate": 3.5764923918304968e-06, "loss": 1.1164, "step": 12533 }, { "epoch": 0.38, "learning_rate": 3.576272238051384e-06, "loss": 1.1499, "step": 12534 }, { "epoch": 0.38, "learning_rate": 3.576052074026677e-06, "loss": 1.0696, "step": 12535 }, { "epoch": 0.38, "learning_rate": 3.575831899758473e-06, "loss": 1.158, "step": 12536 }, { "epoch": 0.38, "learning_rate": 3.5756117152488667e-06, "loss": 1.0806, "step": 12537 }, { "epoch": 0.38, "learning_rate": 3.5753915204999555e-06, "loss": 1.1331, "step": 12538 }, { "epoch": 0.38, "learning_rate": 3.575171315513835e-06, "loss": 1.0712, "step": 12539 }, { "epoch": 0.38, "learning_rate": 3.5749511002926017e-06, "loss": 1.1085, "step": 12540 }, { "epoch": 0.38, "learning_rate": 3.5747308748383515e-06, "loss": 1.083, "step": 12541 }, { "epoch": 0.38, "learning_rate": 3.574510639153181e-06, "loss": 1.1093, "step": 12542 }, { "epoch": 0.38, "learning_rate": 3.574290393239186e-06, "loss": 1.1823, "step": 12543 }, { "epoch": 0.38, "learning_rate": 3.5740701370984644e-06, "loss": 1.1915, "step": 12544 }, { "epoch": 0.38, "learning_rate": 3.5738498707331115e-06, "loss": 1.1727, "step": 12545 }, { "epoch": 0.38, "learning_rate": 3.573629594145226e-06, "loss": 1.0376, "step": 12546 }, { "epoch": 0.38, "learning_rate": 3.5734093073369035e-06, "loss": 1.0377, "step": 12547 }, { "epoch": 0.38, "learning_rate": 3.5731890103102416e-06, "loss": 1.0861, "step": 12548 }, { "epoch": 0.38, "learning_rate": 3.572968703067338e-06, "loss": 1.099, "step": 12549 }, { "epoch": 0.38, "learning_rate": 3.5727483856102874e-06, "loss": 1.0587, "step": 12550 }, { "epoch": 0.38, "learning_rate": 3.57252805794119e-06, "loss": 1.1573, "step": 12551 }, { "epoch": 0.38, "learning_rate": 3.5723077200621414e-06, "loss": 1.1428, "step": 12552 }, { "epoch": 0.38, "learning_rate": 3.5720873719752404e-06, "loss": 1.2992, "step": 12553 }, { "epoch": 0.38, "learning_rate": 3.5718670136825833e-06, "loss": 1.0422, "step": 12554 }, { "epoch": 0.38, "learning_rate": 3.5716466451862693e-06, "loss": 1.1763, "step": 12555 }, { "epoch": 0.38, "learning_rate": 3.5714262664883945e-06, "loss": 1.0751, "step": 12556 }, { "epoch": 0.38, "learning_rate": 3.571205877591058e-06, "loss": 1.0661, "step": 12557 }, { "epoch": 0.38, "learning_rate": 3.5709854784963573e-06, "loss": 1.1573, "step": 12558 }, { "epoch": 0.38, "learning_rate": 3.5707650692063906e-06, "loss": 1.1988, "step": 12559 }, { "epoch": 0.38, "learning_rate": 3.5705446497232565e-06, "loss": 1.2266, "step": 12560 }, { "epoch": 0.38, "learning_rate": 3.5703242200490522e-06, "loss": 1.1246, "step": 12561 }, { "epoch": 0.38, "learning_rate": 3.570103780185878e-06, "loss": 1.1796, "step": 12562 }, { "epoch": 0.38, "learning_rate": 3.5698833301358304e-06, "loss": 1.0385, "step": 12563 }, { "epoch": 0.38, "learning_rate": 3.569662869901009e-06, "loss": 1.1649, "step": 12564 }, { "epoch": 0.38, "learning_rate": 3.569442399483512e-06, "loss": 1.0692, "step": 12565 }, { "epoch": 0.38, "learning_rate": 3.569221918885439e-06, "loss": 1.1668, "step": 12566 }, { "epoch": 0.38, "learning_rate": 3.5690014281088875e-06, "loss": 1.2339, "step": 12567 }, { "epoch": 0.38, "learning_rate": 3.5687809271559582e-06, "loss": 1.1293, "step": 12568 }, { "epoch": 0.38, "learning_rate": 3.568560416028748e-06, "loss": 1.0173, "step": 12569 }, { "epoch": 0.38, "learning_rate": 3.568339894729358e-06, "loss": 1.0404, "step": 12570 }, { "epoch": 0.38, "learning_rate": 3.5681193632598865e-06, "loss": 1.1588, "step": 12571 }, { "epoch": 0.38, "learning_rate": 3.567898821622433e-06, "loss": 1.0924, "step": 12572 }, { "epoch": 0.38, "learning_rate": 3.567678269819097e-06, "loss": 1.0819, "step": 12573 }, { "epoch": 0.38, "learning_rate": 3.5674577078519785e-06, "loss": 1.1094, "step": 12574 }, { "epoch": 0.38, "learning_rate": 3.5672371357231765e-06, "loss": 1.1172, "step": 12575 }, { "epoch": 0.38, "learning_rate": 3.567016553434791e-06, "loss": 1.1651, "step": 12576 }, { "epoch": 0.38, "learning_rate": 3.5667959609889225e-06, "loss": 1.0901, "step": 12577 }, { "epoch": 0.38, "learning_rate": 3.5665753583876692e-06, "loss": 1.0991, "step": 12578 }, { "epoch": 0.38, "learning_rate": 3.5663547456331325e-06, "loss": 1.1486, "step": 12579 }, { "epoch": 0.38, "learning_rate": 3.5661341227274128e-06, "loss": 1.1891, "step": 12580 }, { "epoch": 0.38, "learning_rate": 3.5659134896726087e-06, "loss": 1.1631, "step": 12581 }, { "epoch": 0.38, "learning_rate": 3.5656928464708217e-06, "loss": 1.2069, "step": 12582 }, { "epoch": 0.38, "learning_rate": 3.5654721931241533e-06, "loss": 1.1671, "step": 12583 }, { "epoch": 0.38, "learning_rate": 3.565251529634701e-06, "loss": 1.0645, "step": 12584 }, { "epoch": 0.38, "learning_rate": 3.5650308560045683e-06, "loss": 1.1855, "step": 12585 }, { "epoch": 0.38, "learning_rate": 3.564810172235854e-06, "loss": 1.1104, "step": 12586 }, { "epoch": 0.38, "learning_rate": 3.56458947833066e-06, "loss": 1.1035, "step": 12587 }, { "epoch": 0.38, "learning_rate": 3.5643687742910877e-06, "loss": 1.0855, "step": 12588 }, { "epoch": 0.38, "learning_rate": 3.564148060119236e-06, "loss": 1.2375, "step": 12589 }, { "epoch": 0.38, "learning_rate": 3.563927335817209e-06, "loss": 1.1848, "step": 12590 }, { "epoch": 0.38, "learning_rate": 3.5637066013871046e-06, "loss": 0.9589, "step": 12591 }, { "epoch": 0.38, "learning_rate": 3.563485856831026e-06, "loss": 1.1115, "step": 12592 }, { "epoch": 0.38, "learning_rate": 3.5632651021510743e-06, "loss": 1.1166, "step": 12593 }, { "epoch": 0.38, "learning_rate": 3.5630443373493518e-06, "loss": 1.1119, "step": 12594 }, { "epoch": 0.38, "learning_rate": 3.5628235624279576e-06, "loss": 1.2274, "step": 12595 }, { "epoch": 0.38, "learning_rate": 3.5626027773889967e-06, "loss": 1.0874, "step": 12596 }, { "epoch": 0.38, "learning_rate": 3.562381982234567e-06, "loss": 1.1082, "step": 12597 }, { "epoch": 0.38, "learning_rate": 3.562161176966774e-06, "loss": 1.1705, "step": 12598 }, { "epoch": 0.38, "learning_rate": 3.561940361587718e-06, "loss": 1.1641, "step": 12599 }, { "epoch": 0.38, "learning_rate": 3.5617195360995004e-06, "loss": 1.0925, "step": 12600 }, { "epoch": 0.38, "learning_rate": 3.5614987005042252e-06, "loss": 1.1354, "step": 12601 }, { "epoch": 0.38, "learning_rate": 3.5612778548039927e-06, "loss": 1.0851, "step": 12602 }, { "epoch": 0.38, "learning_rate": 3.5610569990009077e-06, "loss": 1.0831, "step": 12603 }, { "epoch": 0.38, "learning_rate": 3.56083613309707e-06, "loss": 1.1599, "step": 12604 }, { "epoch": 0.38, "learning_rate": 3.5606152570945827e-06, "loss": 1.121, "step": 12605 }, { "epoch": 0.38, "learning_rate": 3.5603943709955495e-06, "loss": 1.0992, "step": 12606 }, { "epoch": 0.38, "learning_rate": 3.5601734748020732e-06, "loss": 1.1234, "step": 12607 }, { "epoch": 0.38, "learning_rate": 3.559952568516255e-06, "loss": 1.1631, "step": 12608 }, { "epoch": 0.38, "learning_rate": 3.5597316521401997e-06, "loss": 0.9899, "step": 12609 }, { "epoch": 0.38, "learning_rate": 3.5595107256760088e-06, "loss": 1.0768, "step": 12610 }, { "epoch": 0.38, "learning_rate": 3.559289789125786e-06, "loss": 1.0573, "step": 12611 }, { "epoch": 0.38, "learning_rate": 3.5590688424916346e-06, "loss": 1.2432, "step": 12612 }, { "epoch": 0.38, "learning_rate": 3.5588478857756586e-06, "loss": 1.3024, "step": 12613 }, { "epoch": 0.38, "learning_rate": 3.55862691897996e-06, "loss": 1.1677, "step": 12614 }, { "epoch": 0.38, "learning_rate": 3.558405942106643e-06, "loss": 1.1697, "step": 12615 }, { "epoch": 0.38, "learning_rate": 3.558184955157812e-06, "loss": 1.1329, "step": 12616 }, { "epoch": 0.38, "learning_rate": 3.557963958135569e-06, "loss": 1.2333, "step": 12617 }, { "epoch": 0.38, "learning_rate": 3.557742951042019e-06, "loss": 1.0948, "step": 12618 }, { "epoch": 0.38, "learning_rate": 3.5575219338792656e-06, "loss": 1.1879, "step": 12619 }, { "epoch": 0.38, "learning_rate": 3.5573009066494125e-06, "loss": 1.1331, "step": 12620 }, { "epoch": 0.38, "learning_rate": 3.5570798693545637e-06, "loss": 1.145, "step": 12621 }, { "epoch": 0.38, "learning_rate": 3.5568588219968246e-06, "loss": 1.0811, "step": 12622 }, { "epoch": 0.38, "learning_rate": 3.556637764578298e-06, "loss": 1.266, "step": 12623 }, { "epoch": 0.38, "learning_rate": 3.556416697101088e-06, "loss": 1.095, "step": 12624 }, { "epoch": 0.38, "learning_rate": 3.556195619567301e-06, "loss": 1.1003, "step": 12625 }, { "epoch": 0.38, "learning_rate": 3.5559745319790396e-06, "loss": 1.1427, "step": 12626 }, { "epoch": 0.38, "learning_rate": 3.5557534343384093e-06, "loss": 1.116, "step": 12627 }, { "epoch": 0.38, "learning_rate": 3.555532326647515e-06, "loss": 1.1571, "step": 12628 }, { "epoch": 0.38, "learning_rate": 3.555311208908462e-06, "loss": 1.158, "step": 12629 }, { "epoch": 0.38, "learning_rate": 3.5550900811233534e-06, "loss": 1.2047, "step": 12630 }, { "epoch": 0.38, "learning_rate": 3.5548689432942962e-06, "loss": 1.1459, "step": 12631 }, { "epoch": 0.38, "learning_rate": 3.5546477954233937e-06, "loss": 1.137, "step": 12632 }, { "epoch": 0.38, "learning_rate": 3.5544266375127533e-06, "loss": 1.1124, "step": 12633 }, { "epoch": 0.38, "learning_rate": 3.5542054695644785e-06, "loss": 1.1196, "step": 12634 }, { "epoch": 0.38, "learning_rate": 3.5539842915806755e-06, "loss": 1.1188, "step": 12635 }, { "epoch": 0.38, "learning_rate": 3.5537631035634496e-06, "loss": 1.2346, "step": 12636 }, { "epoch": 0.38, "learning_rate": 3.553541905514907e-06, "loss": 1.0797, "step": 12637 }, { "epoch": 0.38, "learning_rate": 3.553320697437152e-06, "loss": 1.0876, "step": 12638 }, { "epoch": 0.38, "learning_rate": 3.5530994793322917e-06, "loss": 1.0064, "step": 12639 }, { "epoch": 0.38, "learning_rate": 3.5528782512024306e-06, "loss": 1.0752, "step": 12640 }, { "epoch": 0.38, "learning_rate": 3.552657013049677e-06, "loss": 1.1032, "step": 12641 }, { "epoch": 0.38, "learning_rate": 3.5524357648761355e-06, "loss": 1.1923, "step": 12642 }, { "epoch": 0.38, "learning_rate": 3.5522145066839113e-06, "loss": 1.0286, "step": 12643 }, { "epoch": 0.38, "learning_rate": 3.5519932384751125e-06, "loss": 1.1705, "step": 12644 }, { "epoch": 0.38, "learning_rate": 3.551771960251845e-06, "loss": 1.1155, "step": 12645 }, { "epoch": 0.38, "learning_rate": 3.5515506720162146e-06, "loss": 1.1541, "step": 12646 }, { "epoch": 0.38, "learning_rate": 3.551329373770328e-06, "loss": 1.1961, "step": 12647 }, { "epoch": 0.38, "learning_rate": 3.5511080655162934e-06, "loss": 1.0679, "step": 12648 }, { "epoch": 0.38, "learning_rate": 3.550886747256215e-06, "loss": 1.1385, "step": 12649 }, { "epoch": 0.38, "learning_rate": 3.550665418992201e-06, "loss": 1.2548, "step": 12650 }, { "epoch": 0.38, "learning_rate": 3.5504440807263584e-06, "loss": 1.1277, "step": 12651 }, { "epoch": 0.38, "learning_rate": 3.550222732460794e-06, "loss": 1.1778, "step": 12652 }, { "epoch": 0.38, "learning_rate": 3.550001374197615e-06, "loss": 1.0812, "step": 12653 }, { "epoch": 0.38, "learning_rate": 3.5497800059389285e-06, "loss": 1.2609, "step": 12654 }, { "epoch": 0.38, "learning_rate": 3.5495586276868423e-06, "loss": 1.1895, "step": 12655 }, { "epoch": 0.38, "learning_rate": 3.5493372394434625e-06, "loss": 1.2906, "step": 12656 }, { "epoch": 0.38, "learning_rate": 3.5491158412108987e-06, "loss": 1.0495, "step": 12657 }, { "epoch": 0.38, "learning_rate": 3.5488944329912566e-06, "loss": 1.1799, "step": 12658 }, { "epoch": 0.38, "learning_rate": 3.5486730147866456e-06, "loss": 1.0574, "step": 12659 }, { "epoch": 0.38, "learning_rate": 3.548451586599172e-06, "loss": 1.1013, "step": 12660 }, { "epoch": 0.38, "learning_rate": 3.5482301484309444e-06, "loss": 1.0745, "step": 12661 }, { "epoch": 0.38, "learning_rate": 3.5480087002840702e-06, "loss": 1.1174, "step": 12662 }, { "epoch": 0.38, "learning_rate": 3.5477872421606587e-06, "loss": 1.2559, "step": 12663 }, { "epoch": 0.38, "learning_rate": 3.5475657740628162e-06, "loss": 1.1161, "step": 12664 }, { "epoch": 0.38, "learning_rate": 3.5473442959926525e-06, "loss": 1.108, "step": 12665 }, { "epoch": 0.38, "learning_rate": 3.5471228079522757e-06, "loss": 1.1876, "step": 12666 }, { "epoch": 0.38, "learning_rate": 3.5469013099437936e-06, "loss": 1.2356, "step": 12667 }, { "epoch": 0.38, "learning_rate": 3.546679801969316e-06, "loss": 1.1219, "step": 12668 }, { "epoch": 0.38, "learning_rate": 3.5464582840309503e-06, "loss": 1.0869, "step": 12669 }, { "epoch": 0.38, "learning_rate": 3.546236756130806e-06, "loss": 1.1838, "step": 12670 }, { "epoch": 0.38, "learning_rate": 3.546015218270991e-06, "loss": 1.1222, "step": 12671 }, { "epoch": 0.38, "learning_rate": 3.5457936704536155e-06, "loss": 1.0813, "step": 12672 }, { "epoch": 0.38, "learning_rate": 3.545572112680788e-06, "loss": 1.147, "step": 12673 }, { "epoch": 0.38, "learning_rate": 3.5453505449546177e-06, "loss": 1.1813, "step": 12674 }, { "epoch": 0.38, "learning_rate": 3.545128967277213e-06, "loss": 1.0887, "step": 12675 }, { "epoch": 0.38, "learning_rate": 3.544907379650685e-06, "loss": 1.097, "step": 12676 }, { "epoch": 0.38, "learning_rate": 3.5446857820771406e-06, "loss": 1.1533, "step": 12677 }, { "epoch": 0.38, "learning_rate": 3.5444641745586915e-06, "loss": 1.0654, "step": 12678 }, { "epoch": 0.38, "learning_rate": 3.5442425570974465e-06, "loss": 1.2966, "step": 12679 }, { "epoch": 0.38, "learning_rate": 3.5440209296955147e-06, "loss": 1.1907, "step": 12680 }, { "epoch": 0.38, "learning_rate": 3.543799292355007e-06, "loss": 1.1561, "step": 12681 }, { "epoch": 0.38, "learning_rate": 3.5435776450780324e-06, "loss": 1.0557, "step": 12682 }, { "epoch": 0.38, "learning_rate": 3.543355987866702e-06, "loss": 1.1025, "step": 12683 }, { "epoch": 0.38, "learning_rate": 3.543134320723124e-06, "loss": 1.1737, "step": 12684 }, { "epoch": 0.38, "learning_rate": 3.5429126436494106e-06, "loss": 1.098, "step": 12685 }, { "epoch": 0.38, "learning_rate": 3.5426909566476704e-06, "loss": 1.1094, "step": 12686 }, { "epoch": 0.38, "learning_rate": 3.542469259720015e-06, "loss": 1.3087, "step": 12687 }, { "epoch": 0.38, "learning_rate": 3.5422475528685542e-06, "loss": 1.1222, "step": 12688 }, { "epoch": 0.38, "learning_rate": 3.5420258360953986e-06, "loss": 1.0912, "step": 12689 }, { "epoch": 0.38, "learning_rate": 3.541804109402659e-06, "loss": 1.155, "step": 12690 }, { "epoch": 0.38, "learning_rate": 3.541582372792445e-06, "loss": 1.171, "step": 12691 }, { "epoch": 0.38, "learning_rate": 3.54136062626687e-06, "loss": 1.1652, "step": 12692 }, { "epoch": 0.38, "learning_rate": 3.5411388698280426e-06, "loss": 1.2458, "step": 12693 }, { "epoch": 0.38, "learning_rate": 3.5409171034780744e-06, "loss": 1.0707, "step": 12694 }, { "epoch": 0.38, "learning_rate": 3.5406953272190774e-06, "loss": 1.0299, "step": 12695 }, { "epoch": 0.38, "learning_rate": 3.5404735410531613e-06, "loss": 1.0509, "step": 12696 }, { "epoch": 0.38, "learning_rate": 3.5402517449824384e-06, "loss": 1.0428, "step": 12697 }, { "epoch": 0.38, "learning_rate": 3.5400299390090203e-06, "loss": 1.0981, "step": 12698 }, { "epoch": 0.38, "learning_rate": 3.539808123135018e-06, "loss": 1.1874, "step": 12699 }, { "epoch": 0.38, "learning_rate": 3.5395862973625433e-06, "loss": 1.2067, "step": 12700 }, { "epoch": 0.38, "learning_rate": 3.5393644616937074e-06, "loss": 1.0221, "step": 12701 }, { "epoch": 0.38, "learning_rate": 3.5391426161306224e-06, "loss": 1.1954, "step": 12702 }, { "epoch": 0.38, "learning_rate": 3.5389207606754e-06, "loss": 1.0615, "step": 12703 }, { "epoch": 0.38, "learning_rate": 3.5386988953301527e-06, "loss": 1.0917, "step": 12704 }, { "epoch": 0.38, "learning_rate": 3.538477020096992e-06, "loss": 1.0591, "step": 12705 }, { "epoch": 0.38, "learning_rate": 3.53825513497803e-06, "loss": 1.1688, "step": 12706 }, { "epoch": 0.38, "learning_rate": 3.53803323997538e-06, "loss": 0.9057, "step": 12707 }, { "epoch": 0.38, "learning_rate": 3.5378113350911526e-06, "loss": 1.1583, "step": 12708 }, { "epoch": 0.38, "learning_rate": 3.537589420327461e-06, "loss": 1.12, "step": 12709 }, { "epoch": 0.38, "learning_rate": 3.537367495686418e-06, "loss": 1.0471, "step": 12710 }, { "epoch": 0.38, "learning_rate": 3.5371455611701367e-06, "loss": 1.0917, "step": 12711 }, { "epoch": 0.38, "learning_rate": 3.5369236167807286e-06, "loss": 1.1197, "step": 12712 }, { "epoch": 0.38, "learning_rate": 3.5367016625203076e-06, "loss": 1.0759, "step": 12713 }, { "epoch": 0.38, "learning_rate": 3.5364796983909855e-06, "loss": 1.173, "step": 12714 }, { "epoch": 0.38, "learning_rate": 3.536257724394876e-06, "loss": 1.1839, "step": 12715 }, { "epoch": 0.38, "learning_rate": 3.5360357405340917e-06, "loss": 1.1812, "step": 12716 }, { "epoch": 0.38, "learning_rate": 3.5358137468107467e-06, "loss": 1.2395, "step": 12717 }, { "epoch": 0.38, "learning_rate": 3.535591743226954e-06, "loss": 1.1613, "step": 12718 }, { "epoch": 0.38, "learning_rate": 3.5353697297848254e-06, "loss": 1.1616, "step": 12719 }, { "epoch": 0.38, "learning_rate": 3.535147706486477e-06, "loss": 1.2064, "step": 12720 }, { "epoch": 0.38, "learning_rate": 3.53492567333402e-06, "loss": 1.0447, "step": 12721 }, { "epoch": 0.38, "learning_rate": 3.534703630329569e-06, "loss": 1.1985, "step": 12722 }, { "epoch": 0.38, "learning_rate": 3.534481577475238e-06, "loss": 1.108, "step": 12723 }, { "epoch": 0.38, "learning_rate": 3.5342595147731413e-06, "loss": 1.2112, "step": 12724 }, { "epoch": 0.38, "learning_rate": 3.5340374422253913e-06, "loss": 1.1881, "step": 12725 }, { "epoch": 0.38, "learning_rate": 3.5338153598341037e-06, "loss": 1.116, "step": 12726 }, { "epoch": 0.38, "learning_rate": 3.5335932676013906e-06, "loss": 0.9906, "step": 12727 }, { "epoch": 0.38, "learning_rate": 3.5333711655293683e-06, "loss": 1.0804, "step": 12728 }, { "epoch": 0.38, "learning_rate": 3.53314905362015e-06, "loss": 1.2641, "step": 12729 }, { "epoch": 0.38, "learning_rate": 3.5329269318758508e-06, "loss": 1.2264, "step": 12730 }, { "epoch": 0.38, "learning_rate": 3.5327048002985835e-06, "loss": 1.0438, "step": 12731 }, { "epoch": 0.38, "learning_rate": 3.532482658890464e-06, "loss": 1.2009, "step": 12732 }, { "epoch": 0.38, "learning_rate": 3.5322605076536084e-06, "loss": 1.1442, "step": 12733 }, { "epoch": 0.38, "learning_rate": 3.532038346590128e-06, "loss": 1.0728, "step": 12734 }, { "epoch": 0.38, "learning_rate": 3.531816175702141e-06, "loss": 1.095, "step": 12735 }, { "epoch": 0.38, "learning_rate": 3.5315939949917598e-06, "loss": 1.1334, "step": 12736 }, { "epoch": 0.38, "learning_rate": 3.531371804461101e-06, "loss": 1.0933, "step": 12737 }, { "epoch": 0.38, "learning_rate": 3.5311496041122796e-06, "loss": 1.0524, "step": 12738 }, { "epoch": 0.38, "learning_rate": 3.530927393947411e-06, "loss": 1.1342, "step": 12739 }, { "epoch": 0.38, "learning_rate": 3.5307051739686092e-06, "loss": 1.2136, "step": 12740 }, { "epoch": 0.38, "learning_rate": 3.5304829441779916e-06, "loss": 1.0613, "step": 12741 }, { "epoch": 0.38, "learning_rate": 3.5302607045776715e-06, "loss": 1.0876, "step": 12742 }, { "epoch": 0.38, "learning_rate": 3.5300384551697665e-06, "loss": 1.1123, "step": 12743 }, { "epoch": 0.38, "learning_rate": 3.529816195956391e-06, "loss": 1.1604, "step": 12744 }, { "epoch": 0.38, "learning_rate": 3.5295939269396613e-06, "loss": 1.1272, "step": 12745 }, { "epoch": 0.38, "learning_rate": 3.5293716481216938e-06, "loss": 1.1642, "step": 12746 }, { "epoch": 0.38, "learning_rate": 3.529149359504603e-06, "loss": 1.1254, "step": 12747 }, { "epoch": 0.38, "learning_rate": 3.5289270610905076e-06, "loss": 1.1977, "step": 12748 }, { "epoch": 0.38, "learning_rate": 3.5287047528815212e-06, "loss": 1.1073, "step": 12749 }, { "epoch": 0.38, "learning_rate": 3.5284824348797604e-06, "loss": 1.2683, "step": 12750 }, { "epoch": 0.38, "learning_rate": 3.528260107087342e-06, "loss": 1.0622, "step": 12751 }, { "epoch": 0.38, "learning_rate": 3.528037769506384e-06, "loss": 1.0687, "step": 12752 }, { "epoch": 0.38, "learning_rate": 3.5278154221390004e-06, "loss": 1.1149, "step": 12753 }, { "epoch": 0.38, "learning_rate": 3.5275930649873102e-06, "loss": 1.0522, "step": 12754 }, { "epoch": 0.38, "learning_rate": 3.527370698053428e-06, "loss": 1.0836, "step": 12755 }, { "epoch": 0.38, "learning_rate": 3.527148321339472e-06, "loss": 1.0834, "step": 12756 }, { "epoch": 0.38, "learning_rate": 3.526925934847558e-06, "loss": 1.0904, "step": 12757 }, { "epoch": 0.38, "learning_rate": 3.5267035385798038e-06, "loss": 1.1833, "step": 12758 }, { "epoch": 0.38, "learning_rate": 3.526481132538327e-06, "loss": 1.1166, "step": 12759 }, { "epoch": 0.38, "learning_rate": 3.5262587167252438e-06, "loss": 1.1075, "step": 12760 }, { "epoch": 0.38, "learning_rate": 3.526036291142672e-06, "loss": 1.1615, "step": 12761 }, { "epoch": 0.38, "learning_rate": 3.5258138557927286e-06, "loss": 1.1931, "step": 12762 }, { "epoch": 0.38, "learning_rate": 3.525591410677531e-06, "loss": 1.1714, "step": 12763 }, { "epoch": 0.38, "learning_rate": 3.5253689557991975e-06, "loss": 1.101, "step": 12764 }, { "epoch": 0.38, "learning_rate": 3.525146491159846e-06, "loss": 0.9733, "step": 12765 }, { "epoch": 0.38, "learning_rate": 3.524924016761593e-06, "loss": 1.212, "step": 12766 }, { "epoch": 0.38, "learning_rate": 3.5247015326065577e-06, "loss": 1.1415, "step": 12767 }, { "epoch": 0.38, "learning_rate": 3.5244790386968564e-06, "loss": 1.0754, "step": 12768 }, { "epoch": 0.38, "learning_rate": 3.5242565350346088e-06, "loss": 1.0306, "step": 12769 }, { "epoch": 0.38, "learning_rate": 3.5240340216219315e-06, "loss": 1.1735, "step": 12770 }, { "epoch": 0.38, "learning_rate": 3.523811498460944e-06, "loss": 1.1417, "step": 12771 }, { "epoch": 0.38, "learning_rate": 3.523588965553764e-06, "loss": 1.1052, "step": 12772 }, { "epoch": 0.38, "learning_rate": 3.5233664229025098e-06, "loss": 1.2075, "step": 12773 }, { "epoch": 0.38, "learning_rate": 3.5231438705093013e-06, "loss": 1.2371, "step": 12774 }, { "epoch": 0.38, "learning_rate": 3.522921308376255e-06, "loss": 0.986, "step": 12775 }, { "epoch": 0.38, "learning_rate": 3.52269873650549e-06, "loss": 1.2732, "step": 12776 }, { "epoch": 0.38, "learning_rate": 3.5224761548991253e-06, "loss": 1.1771, "step": 12777 }, { "epoch": 0.38, "learning_rate": 3.5222535635592814e-06, "loss": 1.1035, "step": 12778 }, { "epoch": 0.38, "learning_rate": 3.522030962488075e-06, "loss": 1.1401, "step": 12779 }, { "epoch": 0.38, "learning_rate": 3.5218083516876266e-06, "loss": 1.1334, "step": 12780 }, { "epoch": 0.39, "learning_rate": 3.521585731160055e-06, "loss": 1.1922, "step": 12781 }, { "epoch": 0.39, "learning_rate": 3.5213631009074788e-06, "loss": 1.1219, "step": 12782 }, { "epoch": 0.39, "learning_rate": 3.5211404609320177e-06, "loss": 1.188, "step": 12783 }, { "epoch": 0.39, "learning_rate": 3.520917811235791e-06, "loss": 1.0478, "step": 12784 }, { "epoch": 0.39, "learning_rate": 3.5206951518209192e-06, "loss": 1.1262, "step": 12785 }, { "epoch": 0.39, "learning_rate": 3.5204724826895203e-06, "loss": 1.0997, "step": 12786 }, { "epoch": 0.39, "learning_rate": 3.520249803843716e-06, "loss": 1.158, "step": 12787 }, { "epoch": 0.39, "learning_rate": 3.5200271152856237e-06, "loss": 1.2258, "step": 12788 }, { "epoch": 0.39, "learning_rate": 3.519804417017365e-06, "loss": 1.1532, "step": 12789 }, { "epoch": 0.39, "learning_rate": 3.5195817090410593e-06, "loss": 1.1434, "step": 12790 }, { "epoch": 0.39, "learning_rate": 3.519358991358827e-06, "loss": 1.1844, "step": 12791 }, { "epoch": 0.39, "learning_rate": 3.5191362639727875e-06, "loss": 1.2716, "step": 12792 }, { "epoch": 0.39, "learning_rate": 3.5189135268850626e-06, "loss": 1.1664, "step": 12793 }, { "epoch": 0.39, "learning_rate": 3.5186907800977708e-06, "loss": 1.2273, "step": 12794 }, { "epoch": 0.39, "learning_rate": 3.518468023613034e-06, "loss": 1.091, "step": 12795 }, { "epoch": 0.39, "learning_rate": 3.5182452574329717e-06, "loss": 1.0894, "step": 12796 }, { "epoch": 0.39, "learning_rate": 3.5180224815597047e-06, "loss": 1.1056, "step": 12797 }, { "epoch": 0.39, "learning_rate": 3.5177996959953546e-06, "loss": 1.174, "step": 12798 }, { "epoch": 0.39, "learning_rate": 3.517576900742041e-06, "loss": 1.0443, "step": 12799 }, { "epoch": 0.39, "learning_rate": 3.5173540958018865e-06, "loss": 1.1282, "step": 12800 }, { "epoch": 0.39, "learning_rate": 3.5171312811770096e-06, "loss": 1.2771, "step": 12801 }, { "epoch": 0.39, "learning_rate": 3.516908456869534e-06, "loss": 1.1516, "step": 12802 }, { "epoch": 0.39, "learning_rate": 3.5166856228815786e-06, "loss": 1.1185, "step": 12803 }, { "epoch": 0.39, "learning_rate": 3.516462779215266e-06, "loss": 1.0839, "step": 12804 }, { "epoch": 0.39, "learning_rate": 3.5162399258727177e-06, "loss": 1.0844, "step": 12805 }, { "epoch": 0.39, "learning_rate": 3.516017062856054e-06, "loss": 1.2119, "step": 12806 }, { "epoch": 0.39, "learning_rate": 3.5157941901673976e-06, "loss": 1.0508, "step": 12807 }, { "epoch": 0.39, "learning_rate": 3.5155713078088704e-06, "loss": 1.1942, "step": 12808 }, { "epoch": 0.39, "learning_rate": 3.5153484157825924e-06, "loss": 1.1257, "step": 12809 }, { "epoch": 0.39, "learning_rate": 3.515125514090687e-06, "loss": 1.0925, "step": 12810 }, { "epoch": 0.39, "learning_rate": 3.5149026027352758e-06, "loss": 1.0437, "step": 12811 }, { "epoch": 0.39, "learning_rate": 3.5146796817184803e-06, "loss": 1.2087, "step": 12812 }, { "epoch": 0.39, "learning_rate": 3.514456751042423e-06, "loss": 1.1509, "step": 12813 }, { "epoch": 0.39, "learning_rate": 3.514233810709226e-06, "loss": 1.1556, "step": 12814 }, { "epoch": 0.39, "learning_rate": 3.514010860721012e-06, "loss": 1.1281, "step": 12815 }, { "epoch": 0.39, "learning_rate": 3.5137879010799025e-06, "loss": 1.1232, "step": 12816 }, { "epoch": 0.39, "learning_rate": 3.51356493178802e-06, "loss": 1.2056, "step": 12817 }, { "epoch": 0.39, "learning_rate": 3.513341952847488e-06, "loss": 1.1411, "step": 12818 }, { "epoch": 0.39, "learning_rate": 3.5131189642604292e-06, "loss": 1.0745, "step": 12819 }, { "epoch": 0.39, "learning_rate": 3.5128959660289646e-06, "loss": 1.0607, "step": 12820 }, { "epoch": 0.39, "learning_rate": 3.5126729581552194e-06, "loss": 1.132, "step": 12821 }, { "epoch": 0.39, "learning_rate": 3.5124499406413144e-06, "loss": 1.0295, "step": 12822 }, { "epoch": 0.39, "learning_rate": 3.5122269134893743e-06, "loss": 1.1774, "step": 12823 }, { "epoch": 0.39, "learning_rate": 3.512003876701521e-06, "loss": 1.1486, "step": 12824 }, { "epoch": 0.39, "learning_rate": 3.5117808302798784e-06, "loss": 1.2402, "step": 12825 }, { "epoch": 0.39, "learning_rate": 3.5115577742265694e-06, "loss": 1.146, "step": 12826 }, { "epoch": 0.39, "learning_rate": 3.511334708543718e-06, "loss": 1.1484, "step": 12827 }, { "epoch": 0.39, "learning_rate": 3.5111116332334472e-06, "loss": 1.0554, "step": 12828 }, { "epoch": 0.39, "learning_rate": 3.51088854829788e-06, "loss": 1.1833, "step": 12829 }, { "epoch": 0.39, "learning_rate": 3.5106654537391418e-06, "loss": 1.1882, "step": 12830 }, { "epoch": 0.39, "learning_rate": 3.5104423495593544e-06, "loss": 1.1888, "step": 12831 }, { "epoch": 0.39, "learning_rate": 3.5102192357606422e-06, "loss": 1.1298, "step": 12832 }, { "epoch": 0.39, "learning_rate": 3.5099961123451297e-06, "loss": 1.1555, "step": 12833 }, { "epoch": 0.39, "learning_rate": 3.509772979314941e-06, "loss": 1.0938, "step": 12834 }, { "epoch": 0.39, "learning_rate": 3.5095498366721994e-06, "loss": 1.043, "step": 12835 }, { "epoch": 0.39, "learning_rate": 3.50932668441903e-06, "loss": 1.1289, "step": 12836 }, { "epoch": 0.39, "learning_rate": 3.5091035225575563e-06, "loss": 1.2224, "step": 12837 }, { "epoch": 0.39, "learning_rate": 3.5088803510899028e-06, "loss": 1.2036, "step": 12838 }, { "epoch": 0.39, "learning_rate": 3.5086571700181954e-06, "loss": 1.1472, "step": 12839 }, { "epoch": 0.39, "learning_rate": 3.5084339793445563e-06, "loss": 1.1525, "step": 12840 }, { "epoch": 0.39, "learning_rate": 3.508210779071112e-06, "loss": 1.0886, "step": 12841 }, { "epoch": 0.39, "learning_rate": 3.5079875691999864e-06, "loss": 1.1331, "step": 12842 }, { "epoch": 0.39, "learning_rate": 3.507764349733305e-06, "loss": 1.1697, "step": 12843 }, { "epoch": 0.39, "learning_rate": 3.5075411206731925e-06, "loss": 1.1791, "step": 12844 }, { "epoch": 0.39, "learning_rate": 3.507317882021773e-06, "loss": 1.2053, "step": 12845 }, { "epoch": 0.39, "learning_rate": 3.507094633781173e-06, "loss": 1.1106, "step": 12846 }, { "epoch": 0.39, "learning_rate": 3.5068713759535167e-06, "loss": 1.1509, "step": 12847 }, { "epoch": 0.39, "learning_rate": 3.5066481085409297e-06, "loss": 1.2367, "step": 12848 }, { "epoch": 0.39, "learning_rate": 3.5064248315455383e-06, "loss": 0.9528, "step": 12849 }, { "epoch": 0.39, "learning_rate": 3.5062015449694666e-06, "loss": 1.2608, "step": 12850 }, { "epoch": 0.39, "learning_rate": 3.505978248814841e-06, "loss": 1.1544, "step": 12851 }, { "epoch": 0.39, "learning_rate": 3.5057549430837873e-06, "loss": 1.1575, "step": 12852 }, { "epoch": 0.39, "learning_rate": 3.5055316277784303e-06, "loss": 1.1855, "step": 12853 }, { "epoch": 0.39, "learning_rate": 3.505308302900897e-06, "loss": 1.1901, "step": 12854 }, { "epoch": 0.39, "learning_rate": 3.5050849684533124e-06, "loss": 1.1942, "step": 12855 }, { "epoch": 0.39, "learning_rate": 3.5048616244378036e-06, "loss": 1.1652, "step": 12856 }, { "epoch": 0.39, "learning_rate": 3.504638270856495e-06, "loss": 1.0707, "step": 12857 }, { "epoch": 0.39, "learning_rate": 3.5044149077115147e-06, "loss": 1.1098, "step": 12858 }, { "epoch": 0.39, "learning_rate": 3.5041915350049875e-06, "loss": 1.1591, "step": 12859 }, { "epoch": 0.39, "learning_rate": 3.5039681527390417e-06, "loss": 1.1727, "step": 12860 }, { "epoch": 0.39, "learning_rate": 3.5037447609158016e-06, "loss": 1.2108, "step": 12861 }, { "epoch": 0.39, "learning_rate": 3.503521359537396e-06, "loss": 1.1376, "step": 12862 }, { "epoch": 0.39, "learning_rate": 3.5032979486059493e-06, "loss": 1.0881, "step": 12863 }, { "epoch": 0.39, "learning_rate": 3.5030745281235888e-06, "loss": 1.2238, "step": 12864 }, { "epoch": 0.39, "learning_rate": 3.5028510980924437e-06, "loss": 1.1534, "step": 12865 }, { "epoch": 0.39, "learning_rate": 3.502627658514638e-06, "loss": 1.1005, "step": 12866 }, { "epoch": 0.39, "learning_rate": 3.5024042093923e-06, "loss": 1.2382, "step": 12867 }, { "epoch": 0.39, "learning_rate": 3.5021807507275564e-06, "loss": 1.1747, "step": 12868 }, { "epoch": 0.39, "learning_rate": 3.501957282522536e-06, "loss": 1.2826, "step": 12869 }, { "epoch": 0.39, "learning_rate": 3.501733804779363e-06, "loss": 1.1226, "step": 12870 }, { "epoch": 0.39, "learning_rate": 3.501510317500168e-06, "loss": 1.1357, "step": 12871 }, { "epoch": 0.39, "learning_rate": 3.5012868206870766e-06, "loss": 1.1573, "step": 12872 }, { "epoch": 0.39, "learning_rate": 3.501063314342217e-06, "loss": 1.1771, "step": 12873 }, { "epoch": 0.39, "learning_rate": 3.500839798467716e-06, "loss": 1.111, "step": 12874 }, { "epoch": 0.39, "learning_rate": 3.5006162730657035e-06, "loss": 1.2794, "step": 12875 }, { "epoch": 0.39, "learning_rate": 3.5003927381383045e-06, "loss": 1.1602, "step": 12876 }, { "epoch": 0.39, "learning_rate": 3.500169193687649e-06, "loss": 1.0966, "step": 12877 }, { "epoch": 0.39, "learning_rate": 3.4999456397158655e-06, "loss": 1.1699, "step": 12878 }, { "epoch": 0.39, "learning_rate": 3.49972207622508e-06, "loss": 1.1322, "step": 12879 }, { "epoch": 0.39, "learning_rate": 3.4994985032174222e-06, "loss": 1.0244, "step": 12880 }, { "epoch": 0.39, "learning_rate": 3.49927492069502e-06, "loss": 1.3572, "step": 12881 }, { "epoch": 0.39, "learning_rate": 3.4990513286600027e-06, "loss": 1.0399, "step": 12882 }, { "epoch": 0.39, "learning_rate": 3.4988277271144966e-06, "loss": 1.0788, "step": 12883 }, { "epoch": 0.39, "learning_rate": 3.4986041160606323e-06, "loss": 1.0488, "step": 12884 }, { "epoch": 0.39, "learning_rate": 3.4983804955005367e-06, "loss": 1.1099, "step": 12885 }, { "epoch": 0.39, "learning_rate": 3.4981568654363405e-06, "loss": 1.1749, "step": 12886 }, { "epoch": 0.39, "learning_rate": 3.4979332258701715e-06, "loss": 1.1776, "step": 12887 }, { "epoch": 0.39, "learning_rate": 3.497709576804159e-06, "loss": 1.2434, "step": 12888 }, { "epoch": 0.39, "learning_rate": 3.4974859182404315e-06, "loss": 1.1525, "step": 12889 }, { "epoch": 0.39, "learning_rate": 3.497262250181118e-06, "loss": 1.1626, "step": 12890 }, { "epoch": 0.39, "learning_rate": 3.4970385726283497e-06, "loss": 1.0375, "step": 12891 }, { "epoch": 0.39, "learning_rate": 3.496814885584253e-06, "loss": 1.251, "step": 12892 }, { "epoch": 0.39, "learning_rate": 3.4965911890509594e-06, "loss": 1.1008, "step": 12893 }, { "epoch": 0.39, "learning_rate": 3.4963674830305978e-06, "loss": 1.0565, "step": 12894 }, { "epoch": 0.39, "learning_rate": 3.4961437675252976e-06, "loss": 1.1668, "step": 12895 }, { "epoch": 0.39, "learning_rate": 3.4959200425371874e-06, "loss": 1.1395, "step": 12896 }, { "epoch": 0.39, "learning_rate": 3.4956963080683996e-06, "loss": 1.1106, "step": 12897 }, { "epoch": 0.39, "learning_rate": 3.495472564121061e-06, "loss": 1.1335, "step": 12898 }, { "epoch": 0.39, "learning_rate": 3.4952488106973036e-06, "loss": 1.1139, "step": 12899 }, { "epoch": 0.39, "learning_rate": 3.4950250477992577e-06, "loss": 1.1984, "step": 12900 }, { "epoch": 0.39, "learning_rate": 3.494801275429052e-06, "loss": 1.1599, "step": 12901 }, { "epoch": 0.39, "learning_rate": 3.4945774935888166e-06, "loss": 1.064, "step": 12902 }, { "epoch": 0.39, "learning_rate": 3.494353702280683e-06, "loss": 1.1275, "step": 12903 }, { "epoch": 0.39, "learning_rate": 3.4941299015067807e-06, "loss": 1.1646, "step": 12904 }, { "epoch": 0.39, "learning_rate": 3.493906091269241e-06, "loss": 1.1263, "step": 12905 }, { "epoch": 0.39, "learning_rate": 3.4936822715701945e-06, "loss": 1.1837, "step": 12906 }, { "epoch": 0.39, "learning_rate": 3.49345844241177e-06, "loss": 1.1188, "step": 12907 }, { "epoch": 0.39, "learning_rate": 3.4932346037961006e-06, "loss": 1.2433, "step": 12908 }, { "epoch": 0.39, "learning_rate": 3.4930107557253156e-06, "loss": 1.1089, "step": 12909 }, { "epoch": 0.39, "learning_rate": 3.492786898201547e-06, "loss": 1.0659, "step": 12910 }, { "epoch": 0.39, "learning_rate": 3.4925630312269253e-06, "loss": 1.0608, "step": 12911 }, { "epoch": 0.39, "learning_rate": 3.4923391548035814e-06, "loss": 1.1425, "step": 12912 }, { "epoch": 0.39, "learning_rate": 3.492115268933646e-06, "loss": 1.1066, "step": 12913 }, { "epoch": 0.39, "learning_rate": 3.4918913736192517e-06, "loss": 1.0202, "step": 12914 }, { "epoch": 0.39, "learning_rate": 3.491667468862529e-06, "loss": 1.0333, "step": 12915 }, { "epoch": 0.39, "learning_rate": 3.49144355466561e-06, "loss": 1.0766, "step": 12916 }, { "epoch": 0.39, "learning_rate": 3.491219631030625e-06, "loss": 1.1796, "step": 12917 }, { "epoch": 0.39, "learning_rate": 3.490995697959707e-06, "loss": 1.1696, "step": 12918 }, { "epoch": 0.39, "learning_rate": 3.4907717554549882e-06, "loss": 1.1546, "step": 12919 }, { "epoch": 0.39, "learning_rate": 3.490547803518598e-06, "loss": 1.1542, "step": 12920 }, { "epoch": 0.39, "learning_rate": 3.4903238421526706e-06, "loss": 1.0907, "step": 12921 }, { "epoch": 0.39, "learning_rate": 3.4900998713593367e-06, "loss": 1.2152, "step": 12922 }, { "epoch": 0.39, "learning_rate": 3.489875891140729e-06, "loss": 1.135, "step": 12923 }, { "epoch": 0.39, "learning_rate": 3.48965190149898e-06, "loss": 1.1099, "step": 12924 }, { "epoch": 0.39, "learning_rate": 3.489427902436221e-06, "loss": 1.1409, "step": 12925 }, { "epoch": 0.39, "learning_rate": 3.4892038939545854e-06, "loss": 1.2159, "step": 12926 }, { "epoch": 0.39, "learning_rate": 3.4889798760562043e-06, "loss": 1.0767, "step": 12927 }, { "epoch": 0.39, "learning_rate": 3.4887558487432116e-06, "loss": 1.1139, "step": 12928 }, { "epoch": 0.39, "learning_rate": 3.4885318120177398e-06, "loss": 1.0987, "step": 12929 }, { "epoch": 0.39, "learning_rate": 3.4883077658819204e-06, "loss": 1.1414, "step": 12930 }, { "epoch": 0.39, "learning_rate": 3.4880837103378875e-06, "loss": 1.2441, "step": 12931 }, { "epoch": 0.39, "learning_rate": 3.487859645387774e-06, "loss": 1.1537, "step": 12932 }, { "epoch": 0.39, "learning_rate": 3.4876355710337117e-06, "loss": 1.186, "step": 12933 }, { "epoch": 0.39, "learning_rate": 3.4874114872778345e-06, "loss": 1.149, "step": 12934 }, { "epoch": 0.39, "learning_rate": 3.4871873941222756e-06, "loss": 1.1317, "step": 12935 }, { "epoch": 0.39, "learning_rate": 3.4869632915691686e-06, "loss": 1.1406, "step": 12936 }, { "epoch": 0.39, "learning_rate": 3.4867391796206464e-06, "loss": 0.973, "step": 12937 }, { "epoch": 0.39, "learning_rate": 3.486515058278842e-06, "loss": 1.1524, "step": 12938 }, { "epoch": 0.39, "learning_rate": 3.4862909275458896e-06, "loss": 1.2191, "step": 12939 }, { "epoch": 0.39, "learning_rate": 3.4860667874239225e-06, "loss": 1.1203, "step": 12940 }, { "epoch": 0.39, "learning_rate": 3.485842637915074e-06, "loss": 1.098, "step": 12941 }, { "epoch": 0.39, "learning_rate": 3.485618479021479e-06, "loss": 1.1069, "step": 12942 }, { "epoch": 0.39, "learning_rate": 3.4853943107452704e-06, "loss": 1.1184, "step": 12943 }, { "epoch": 0.39, "learning_rate": 3.4851701330885828e-06, "loss": 1.1972, "step": 12944 }, { "epoch": 0.39, "learning_rate": 3.48494594605355e-06, "loss": 1.261, "step": 12945 }, { "epoch": 0.39, "learning_rate": 3.4847217496423062e-06, "loss": 1.1406, "step": 12946 }, { "epoch": 0.39, "learning_rate": 3.484497543856986e-06, "loss": 1.1389, "step": 12947 }, { "epoch": 0.39, "learning_rate": 3.4842733286997225e-06, "loss": 1.2441, "step": 12948 }, { "epoch": 0.39, "learning_rate": 3.4840491041726514e-06, "loss": 1.0935, "step": 12949 }, { "epoch": 0.39, "learning_rate": 3.4838248702779066e-06, "loss": 1.0865, "step": 12950 }, { "epoch": 0.39, "learning_rate": 3.4836006270176236e-06, "loss": 1.0657, "step": 12951 }, { "epoch": 0.39, "learning_rate": 3.483376374393935e-06, "loss": 1.0892, "step": 12952 }, { "epoch": 0.39, "learning_rate": 3.4831521124089783e-06, "loss": 1.0846, "step": 12953 }, { "epoch": 0.39, "learning_rate": 3.482927841064886e-06, "loss": 1.09, "step": 12954 }, { "epoch": 0.39, "learning_rate": 3.4827035603637942e-06, "loss": 1.2578, "step": 12955 }, { "epoch": 0.39, "learning_rate": 3.482479270307838e-06, "loss": 1.0939, "step": 12956 }, { "epoch": 0.39, "learning_rate": 3.482254970899152e-06, "loss": 1.0418, "step": 12957 }, { "epoch": 0.39, "learning_rate": 3.4820306621398726e-06, "loss": 1.1382, "step": 12958 }, { "epoch": 0.39, "learning_rate": 3.481806344032133e-06, "loss": 0.9881, "step": 12959 }, { "epoch": 0.39, "learning_rate": 3.481582016578071e-06, "loss": 1.0876, "step": 12960 }, { "epoch": 0.39, "learning_rate": 3.4813576797798206e-06, "loss": 1.2086, "step": 12961 }, { "epoch": 0.39, "learning_rate": 3.4811333336395176e-06, "loss": 1.1804, "step": 12962 }, { "epoch": 0.39, "learning_rate": 3.4809089781592974e-06, "loss": 1.05, "step": 12963 }, { "epoch": 0.39, "learning_rate": 3.480684613341297e-06, "loss": 1.0497, "step": 12964 }, { "epoch": 0.39, "learning_rate": 3.4804602391876507e-06, "loss": 0.9976, "step": 12965 }, { "epoch": 0.39, "learning_rate": 3.4802358557004957e-06, "loss": 1.2047, "step": 12966 }, { "epoch": 0.39, "learning_rate": 3.480011462881967e-06, "loss": 1.1429, "step": 12967 }, { "epoch": 0.39, "learning_rate": 3.479787060734201e-06, "loss": 1.1224, "step": 12968 }, { "epoch": 0.39, "learning_rate": 3.4795626492593344e-06, "loss": 1.1367, "step": 12969 }, { "epoch": 0.39, "learning_rate": 3.4793382284595027e-06, "loss": 1.0373, "step": 12970 }, { "epoch": 0.39, "learning_rate": 3.479113798336844e-06, "loss": 1.1185, "step": 12971 }, { "epoch": 0.39, "learning_rate": 3.4788893588934923e-06, "loss": 1.0435, "step": 12972 }, { "epoch": 0.39, "learning_rate": 3.478664910131586e-06, "loss": 1.1738, "step": 12973 }, { "epoch": 0.39, "learning_rate": 3.4784404520532604e-06, "loss": 1.2348, "step": 12974 }, { "epoch": 0.39, "learning_rate": 3.4782159846606535e-06, "loss": 1.0502, "step": 12975 }, { "epoch": 0.39, "learning_rate": 3.477991507955901e-06, "loss": 1.1012, "step": 12976 }, { "epoch": 0.39, "learning_rate": 3.4777670219411414e-06, "loss": 1.149, "step": 12977 }, { "epoch": 0.39, "learning_rate": 3.47754252661851e-06, "loss": 1.0762, "step": 12978 }, { "epoch": 0.39, "learning_rate": 3.477318021990145e-06, "loss": 1.2213, "step": 12979 }, { "epoch": 0.39, "learning_rate": 3.4770935080581826e-06, "loss": 1.2108, "step": 12980 }, { "epoch": 0.39, "learning_rate": 3.47686898482476e-06, "loss": 1.1461, "step": 12981 }, { "epoch": 0.39, "learning_rate": 3.4766444522920157e-06, "loss": 1.0872, "step": 12982 }, { "epoch": 0.39, "learning_rate": 3.4764199104620864e-06, "loss": 1.2036, "step": 12983 }, { "epoch": 0.39, "learning_rate": 3.47619535933711e-06, "loss": 1.0948, "step": 12984 }, { "epoch": 0.39, "learning_rate": 3.4759707989192243e-06, "loss": 1.059, "step": 12985 }, { "epoch": 0.39, "learning_rate": 3.4757462292105664e-06, "loss": 1.1663, "step": 12986 }, { "epoch": 0.39, "learning_rate": 3.4755216502132744e-06, "loss": 1.1074, "step": 12987 }, { "epoch": 0.39, "learning_rate": 3.4752970619294863e-06, "loss": 1.141, "step": 12988 }, { "epoch": 0.39, "learning_rate": 3.4750724643613392e-06, "loss": 1.1216, "step": 12989 }, { "epoch": 0.39, "learning_rate": 3.474847857510973e-06, "loss": 1.0673, "step": 12990 }, { "epoch": 0.39, "learning_rate": 3.4746232413805237e-06, "loss": 1.0458, "step": 12991 }, { "epoch": 0.39, "learning_rate": 3.474398615972131e-06, "loss": 1.1592, "step": 12992 }, { "epoch": 0.39, "learning_rate": 3.474173981287932e-06, "loss": 1.1157, "step": 12993 }, { "epoch": 0.39, "learning_rate": 3.473949337330067e-06, "loss": 1.2185, "step": 12994 }, { "epoch": 0.39, "learning_rate": 3.473724684100672e-06, "loss": 1.156, "step": 12995 }, { "epoch": 0.39, "learning_rate": 3.4735000216018883e-06, "loss": 1.1496, "step": 12996 }, { "epoch": 0.39, "learning_rate": 3.4732753498358522e-06, "loss": 1.194, "step": 12997 }, { "epoch": 0.39, "learning_rate": 3.4730506688047038e-06, "loss": 1.2562, "step": 12998 }, { "epoch": 0.39, "learning_rate": 3.472825978510582e-06, "loss": 1.2246, "step": 12999 }, { "epoch": 0.39, "learning_rate": 3.4726012789556257e-06, "loss": 1.2668, "step": 13000 }, { "epoch": 0.39, "learning_rate": 3.4723765701419732e-06, "loss": 1.104, "step": 13001 }, { "epoch": 0.39, "learning_rate": 3.472151852071764e-06, "loss": 1.0623, "step": 13002 }, { "epoch": 0.39, "learning_rate": 3.471927124747138e-06, "loss": 1.1057, "step": 13003 }, { "epoch": 0.39, "learning_rate": 3.4717023881702332e-06, "loss": 1.152, "step": 13004 }, { "epoch": 0.39, "learning_rate": 3.47147764234319e-06, "loss": 1.2186, "step": 13005 }, { "epoch": 0.39, "learning_rate": 3.4712528872681473e-06, "loss": 1.1698, "step": 13006 }, { "epoch": 0.39, "learning_rate": 3.4710281229472455e-06, "loss": 1.0957, "step": 13007 }, { "epoch": 0.39, "learning_rate": 3.4708033493826226e-06, "loss": 1.1307, "step": 13008 }, { "epoch": 0.39, "learning_rate": 3.4705785665764197e-06, "loss": 1.2391, "step": 13009 }, { "epoch": 0.39, "learning_rate": 3.470353774530776e-06, "loss": 1.1578, "step": 13010 }, { "epoch": 0.39, "learning_rate": 3.470128973247832e-06, "loss": 1.2556, "step": 13011 }, { "epoch": 0.39, "learning_rate": 3.4699041627297283e-06, "loss": 1.2441, "step": 13012 }, { "epoch": 0.39, "learning_rate": 3.4696793429786024e-06, "loss": 1.1851, "step": 13013 }, { "epoch": 0.39, "learning_rate": 3.4694545139965974e-06, "loss": 1.0704, "step": 13014 }, { "epoch": 0.39, "learning_rate": 3.4692296757858525e-06, "loss": 1.1176, "step": 13015 }, { "epoch": 0.39, "learning_rate": 3.4690048283485074e-06, "loss": 1.1026, "step": 13016 }, { "epoch": 0.39, "learning_rate": 3.4687799716867028e-06, "loss": 1.2176, "step": 13017 }, { "epoch": 0.39, "learning_rate": 3.46855510580258e-06, "loss": 1.1631, "step": 13018 }, { "epoch": 0.39, "learning_rate": 3.4683302306982784e-06, "loss": 1.0754, "step": 13019 }, { "epoch": 0.39, "learning_rate": 3.46810534637594e-06, "loss": 1.1805, "step": 13020 }, { "epoch": 0.39, "learning_rate": 3.4678804528377047e-06, "loss": 1.127, "step": 13021 }, { "epoch": 0.39, "learning_rate": 3.4676555500857136e-06, "loss": 1.0577, "step": 13022 }, { "epoch": 0.39, "learning_rate": 3.4674306381221074e-06, "loss": 1.1419, "step": 13023 }, { "epoch": 0.39, "learning_rate": 3.467205716949028e-06, "loss": 1.128, "step": 13024 }, { "epoch": 0.39, "learning_rate": 3.4669807865686157e-06, "loss": 1.0308, "step": 13025 }, { "epoch": 0.39, "learning_rate": 3.466755846983012e-06, "loss": 1.1111, "step": 13026 }, { "epoch": 0.39, "learning_rate": 3.4665308981943583e-06, "loss": 1.1439, "step": 13027 }, { "epoch": 0.39, "learning_rate": 3.466305940204796e-06, "loss": 1.1375, "step": 13028 }, { "epoch": 0.39, "learning_rate": 3.466080973016467e-06, "loss": 0.9979, "step": 13029 }, { "epoch": 0.39, "learning_rate": 3.4658559966315115e-06, "loss": 1.0165, "step": 13030 }, { "epoch": 0.39, "learning_rate": 3.465631011052073e-06, "loss": 1.2375, "step": 13031 }, { "epoch": 0.39, "learning_rate": 3.4654060162802918e-06, "loss": 1.2238, "step": 13032 }, { "epoch": 0.39, "learning_rate": 3.4651810123183104e-06, "loss": 1.1254, "step": 13033 }, { "epoch": 0.39, "learning_rate": 3.4649559991682703e-06, "loss": 1.0142, "step": 13034 }, { "epoch": 0.39, "learning_rate": 3.4647309768323147e-06, "loss": 1.1145, "step": 13035 }, { "epoch": 0.39, "learning_rate": 3.464505945312584e-06, "loss": 1.0945, "step": 13036 }, { "epoch": 0.39, "learning_rate": 3.464280904611221e-06, "loss": 1.1427, "step": 13037 }, { "epoch": 0.39, "learning_rate": 3.4640558547303683e-06, "loss": 1.0853, "step": 13038 }, { "epoch": 0.39, "learning_rate": 3.4638307956721683e-06, "loss": 1.1553, "step": 13039 }, { "epoch": 0.39, "learning_rate": 3.4636057274387642e-06, "loss": 1.2469, "step": 13040 }, { "epoch": 0.39, "learning_rate": 3.4633806500322966e-06, "loss": 1.1013, "step": 13041 }, { "epoch": 0.39, "learning_rate": 3.4631555634549096e-06, "loss": 1.2518, "step": 13042 }, { "epoch": 0.39, "learning_rate": 3.4629304677087455e-06, "loss": 1.0541, "step": 13043 }, { "epoch": 0.39, "learning_rate": 3.462705362795947e-06, "loss": 1.2051, "step": 13044 }, { "epoch": 0.39, "learning_rate": 3.462480248718657e-06, "loss": 1.1212, "step": 13045 }, { "epoch": 0.39, "learning_rate": 3.462255125479019e-06, "loss": 1.0823, "step": 13046 }, { "epoch": 0.39, "learning_rate": 3.4620299930791755e-06, "loss": 1.2076, "step": 13047 }, { "epoch": 0.39, "learning_rate": 3.4618048515212704e-06, "loss": 1.0881, "step": 13048 }, { "epoch": 0.39, "learning_rate": 3.4615797008074452e-06, "loss": 1.1683, "step": 13049 }, { "epoch": 0.39, "learning_rate": 3.4613545409398447e-06, "loss": 1.1501, "step": 13050 }, { "epoch": 0.39, "learning_rate": 3.461129371920612e-06, "loss": 1.1521, "step": 13051 }, { "epoch": 0.39, "learning_rate": 3.4609041937518904e-06, "loss": 1.1057, "step": 13052 }, { "epoch": 0.39, "learning_rate": 3.4606790064358243e-06, "loss": 1.2153, "step": 13053 }, { "epoch": 0.39, "learning_rate": 3.460453809974556e-06, "loss": 1.114, "step": 13054 }, { "epoch": 0.39, "learning_rate": 3.4602286043702304e-06, "loss": 1.0911, "step": 13055 }, { "epoch": 0.39, "learning_rate": 3.4600033896249907e-06, "loss": 1.0635, "step": 13056 }, { "epoch": 0.39, "learning_rate": 3.4597781657409817e-06, "loss": 1.1529, "step": 13057 }, { "epoch": 0.39, "learning_rate": 3.4595529327203463e-06, "loss": 1.0875, "step": 13058 }, { "epoch": 0.39, "learning_rate": 3.4593276905652297e-06, "loss": 1.0488, "step": 13059 }, { "epoch": 0.39, "learning_rate": 3.459102439277775e-06, "loss": 1.2125, "step": 13060 }, { "epoch": 0.39, "learning_rate": 3.4588771788601273e-06, "loss": 1.0454, "step": 13061 }, { "epoch": 0.39, "learning_rate": 3.45865190931443e-06, "loss": 1.0284, "step": 13062 }, { "epoch": 0.39, "learning_rate": 3.458426630642828e-06, "loss": 1.1139, "step": 13063 }, { "epoch": 0.39, "learning_rate": 3.458201342847467e-06, "loss": 1.1198, "step": 13064 }, { "epoch": 0.39, "learning_rate": 3.4579760459304903e-06, "loss": 1.1648, "step": 13065 }, { "epoch": 0.39, "learning_rate": 3.4577507398940436e-06, "loss": 1.1305, "step": 13066 }, { "epoch": 0.39, "learning_rate": 3.45752542474027e-06, "loss": 1.1758, "step": 13067 }, { "epoch": 0.39, "learning_rate": 3.457300100471317e-06, "loss": 1.1464, "step": 13068 }, { "epoch": 0.39, "learning_rate": 3.4570747670893268e-06, "loss": 1.1947, "step": 13069 }, { "epoch": 0.39, "learning_rate": 3.456849424596446e-06, "loss": 1.0255, "step": 13070 }, { "epoch": 0.39, "learning_rate": 3.4566240729948196e-06, "loss": 1.1669, "step": 13071 }, { "epoch": 0.39, "learning_rate": 3.4563987122865936e-06, "loss": 1.0193, "step": 13072 }, { "epoch": 0.39, "learning_rate": 3.4561733424739112e-06, "loss": 1.1205, "step": 13073 }, { "epoch": 0.39, "learning_rate": 3.45594796355892e-06, "loss": 1.3475, "step": 13074 }, { "epoch": 0.39, "learning_rate": 3.455722575543764e-06, "loss": 1.2115, "step": 13075 }, { "epoch": 0.39, "learning_rate": 3.4554971784305895e-06, "loss": 1.2199, "step": 13076 }, { "epoch": 0.39, "learning_rate": 3.455271772221542e-06, "loss": 1.1525, "step": 13077 }, { "epoch": 0.39, "learning_rate": 3.4550463569187677e-06, "loss": 1.1382, "step": 13078 }, { "epoch": 0.39, "learning_rate": 3.454820932524412e-06, "loss": 1.1647, "step": 13079 }, { "epoch": 0.39, "learning_rate": 3.4545954990406205e-06, "loss": 1.1359, "step": 13080 }, { "epoch": 0.39, "learning_rate": 3.4543700564695397e-06, "loss": 1.2172, "step": 13081 }, { "epoch": 0.39, "learning_rate": 3.4541446048133152e-06, "loss": 1.2517, "step": 13082 }, { "epoch": 0.39, "learning_rate": 3.4539191440740947e-06, "loss": 1.1028, "step": 13083 }, { "epoch": 0.39, "learning_rate": 3.453693674254023e-06, "loss": 1.0032, "step": 13084 }, { "epoch": 0.39, "learning_rate": 3.4534681953552464e-06, "loss": 1.1021, "step": 13085 }, { "epoch": 0.39, "learning_rate": 3.453242707379912e-06, "loss": 1.2041, "step": 13086 }, { "epoch": 0.39, "learning_rate": 3.4530172103301664e-06, "loss": 1.1219, "step": 13087 }, { "epoch": 0.39, "learning_rate": 3.4527917042081556e-06, "loss": 1.1642, "step": 13088 }, { "epoch": 0.39, "learning_rate": 3.452566189016026e-06, "loss": 1.1605, "step": 13089 }, { "epoch": 0.39, "learning_rate": 3.4523406647559266e-06, "loss": 1.1141, "step": 13090 }, { "epoch": 0.39, "learning_rate": 3.4521151314300017e-06, "loss": 1.1785, "step": 13091 }, { "epoch": 0.39, "learning_rate": 3.451889589040399e-06, "loss": 1.2239, "step": 13092 }, { "epoch": 0.39, "learning_rate": 3.4516640375892662e-06, "loss": 1.1445, "step": 13093 }, { "epoch": 0.39, "learning_rate": 3.45143847707875e-06, "loss": 1.1456, "step": 13094 }, { "epoch": 0.39, "learning_rate": 3.451212907510998e-06, "loss": 1.1757, "step": 13095 }, { "epoch": 0.39, "learning_rate": 3.450987328888158e-06, "loss": 1.129, "step": 13096 }, { "epoch": 0.39, "learning_rate": 3.450761741212375e-06, "loss": 1.1645, "step": 13097 }, { "epoch": 0.39, "learning_rate": 3.4505361444857997e-06, "loss": 1.0592, "step": 13098 }, { "epoch": 0.39, "learning_rate": 3.4503105387105773e-06, "loss": 1.165, "step": 13099 }, { "epoch": 0.39, "learning_rate": 3.4500849238888567e-06, "loss": 1.2172, "step": 13100 }, { "epoch": 0.39, "learning_rate": 3.4498593000227843e-06, "loss": 1.1033, "step": 13101 }, { "epoch": 0.39, "learning_rate": 3.4496336671145098e-06, "loss": 1.1747, "step": 13102 }, { "epoch": 0.39, "learning_rate": 3.449408025166179e-06, "loss": 1.0286, "step": 13103 }, { "epoch": 0.39, "learning_rate": 3.4491823741799417e-06, "loss": 1.1921, "step": 13104 }, { "epoch": 0.39, "learning_rate": 3.4489567141579456e-06, "loss": 1.1152, "step": 13105 }, { "epoch": 0.39, "learning_rate": 3.448731045102338e-06, "loss": 1.0801, "step": 13106 }, { "epoch": 0.39, "learning_rate": 3.4485053670152684e-06, "loss": 1.2043, "step": 13107 }, { "epoch": 0.39, "learning_rate": 3.4482796798988842e-06, "loss": 1.084, "step": 13108 }, { "epoch": 0.39, "learning_rate": 3.448053983755335e-06, "loss": 1.1263, "step": 13109 }, { "epoch": 0.39, "learning_rate": 3.4478282785867674e-06, "loss": 1.072, "step": 13110 }, { "epoch": 0.39, "learning_rate": 3.4476025643953317e-06, "loss": 1.2198, "step": 13111 }, { "epoch": 0.39, "learning_rate": 3.4473768411831755e-06, "loss": 1.2976, "step": 13112 }, { "epoch": 0.4, "learning_rate": 3.4471511089524486e-06, "loss": 1.2669, "step": 13113 }, { "epoch": 0.4, "learning_rate": 3.4469253677052983e-06, "loss": 1.1429, "step": 13114 }, { "epoch": 0.4, "learning_rate": 3.446699617443876e-06, "loss": 1.1858, "step": 13115 }, { "epoch": 0.4, "learning_rate": 3.4464738581703284e-06, "loss": 1.1018, "step": 13116 }, { "epoch": 0.4, "learning_rate": 3.446248089886805e-06, "loss": 1.0948, "step": 13117 }, { "epoch": 0.4, "learning_rate": 3.4460223125954563e-06, "loss": 1.2131, "step": 13118 }, { "epoch": 0.4, "learning_rate": 3.4457965262984305e-06, "loss": 1.1304, "step": 13119 }, { "epoch": 0.4, "learning_rate": 3.445570730997877e-06, "loss": 1.1656, "step": 13120 }, { "epoch": 0.4, "learning_rate": 3.445344926695946e-06, "loss": 1.1423, "step": 13121 }, { "epoch": 0.4, "learning_rate": 3.445119113394787e-06, "loss": 1.0006, "step": 13122 }, { "epoch": 0.4, "learning_rate": 3.4448932910965484e-06, "loss": 1.0903, "step": 13123 }, { "epoch": 0.4, "learning_rate": 3.444667459803381e-06, "loss": 1.2366, "step": 13124 }, { "epoch": 0.4, "learning_rate": 3.4444416195174345e-06, "loss": 1.1622, "step": 13125 }, { "epoch": 0.4, "learning_rate": 3.444215770240859e-06, "loss": 1.2274, "step": 13126 }, { "epoch": 0.4, "learning_rate": 3.4439899119758035e-06, "loss": 1.0807, "step": 13127 }, { "epoch": 0.4, "learning_rate": 3.443764044724419e-06, "loss": 1.0544, "step": 13128 }, { "epoch": 0.4, "learning_rate": 3.4435381684888554e-06, "loss": 1.0768, "step": 13129 }, { "epoch": 0.4, "learning_rate": 3.443312283271262e-06, "loss": 1.0817, "step": 13130 }, { "epoch": 0.4, "learning_rate": 3.4430863890737907e-06, "loss": 1.1063, "step": 13131 }, { "epoch": 0.4, "learning_rate": 3.4428604858985916e-06, "loss": 1.1633, "step": 13132 }, { "epoch": 0.4, "learning_rate": 3.442634573747814e-06, "loss": 1.1807, "step": 13133 }, { "epoch": 0.4, "learning_rate": 3.442408652623609e-06, "loss": 1.1333, "step": 13134 }, { "epoch": 0.4, "learning_rate": 3.4421827225281285e-06, "loss": 1.2164, "step": 13135 }, { "epoch": 0.4, "learning_rate": 3.4419567834635213e-06, "loss": 1.2023, "step": 13136 }, { "epoch": 0.4, "learning_rate": 3.44173083543194e-06, "loss": 1.1967, "step": 13137 }, { "epoch": 0.4, "learning_rate": 3.4415048784355343e-06, "loss": 1.1603, "step": 13138 }, { "epoch": 0.4, "learning_rate": 3.441278912476456e-06, "loss": 1.0486, "step": 13139 }, { "epoch": 0.4, "learning_rate": 3.441052937556856e-06, "loss": 1.1155, "step": 13140 }, { "epoch": 0.4, "learning_rate": 3.4408269536788846e-06, "loss": 1.1486, "step": 13141 }, { "epoch": 0.4, "learning_rate": 3.4406009608446933e-06, "loss": 1.1292, "step": 13142 }, { "epoch": 0.4, "learning_rate": 3.4403749590564344e-06, "loss": 1.036, "step": 13143 }, { "epoch": 0.4, "learning_rate": 3.4401489483162592e-06, "loss": 1.1167, "step": 13144 }, { "epoch": 0.4, "learning_rate": 3.4399229286263182e-06, "loss": 1.0782, "step": 13145 }, { "epoch": 0.4, "learning_rate": 3.4396968999887637e-06, "loss": 1.1484, "step": 13146 }, { "epoch": 0.4, "learning_rate": 3.4394708624057472e-06, "loss": 1.1242, "step": 13147 }, { "epoch": 0.4, "learning_rate": 3.439244815879421e-06, "loss": 1.1725, "step": 13148 }, { "epoch": 0.4, "learning_rate": 3.439018760411936e-06, "loss": 1.2198, "step": 13149 }, { "epoch": 0.4, "learning_rate": 3.4387926960054453e-06, "loss": 1.0642, "step": 13150 }, { "epoch": 0.4, "learning_rate": 3.4385666226620996e-06, "loss": 1.1615, "step": 13151 }, { "epoch": 0.4, "learning_rate": 3.4383405403840526e-06, "loss": 1.0474, "step": 13152 }, { "epoch": 0.4, "learning_rate": 3.4381144491734545e-06, "loss": 1.1432, "step": 13153 }, { "epoch": 0.4, "learning_rate": 3.4378883490324593e-06, "loss": 1.0725, "step": 13154 }, { "epoch": 0.4, "learning_rate": 3.437662239963219e-06, "loss": 1.0368, "step": 13155 }, { "epoch": 0.4, "learning_rate": 3.437436121967884e-06, "loss": 1.2119, "step": 13156 }, { "epoch": 0.4, "learning_rate": 3.4372099950486106e-06, "loss": 1.1141, "step": 13157 }, { "epoch": 0.4, "learning_rate": 3.4369838592075488e-06, "loss": 1.1111, "step": 13158 }, { "epoch": 0.4, "learning_rate": 3.4367577144468522e-06, "loss": 1.0104, "step": 13159 }, { "epoch": 0.4, "learning_rate": 3.4365315607686724e-06, "loss": 1.1858, "step": 13160 }, { "epoch": 0.4, "learning_rate": 3.436305398175164e-06, "loss": 1.0375, "step": 13161 }, { "epoch": 0.4, "learning_rate": 3.4360792266684782e-06, "loss": 1.2441, "step": 13162 }, { "epoch": 0.4, "learning_rate": 3.43585304625077e-06, "loss": 1.1212, "step": 13163 }, { "epoch": 0.4, "learning_rate": 3.4356268569241915e-06, "loss": 1.1213, "step": 13164 }, { "epoch": 0.4, "learning_rate": 3.4354006586908954e-06, "loss": 1.2471, "step": 13165 }, { "epoch": 0.4, "learning_rate": 3.435174451553036e-06, "loss": 1.1146, "step": 13166 }, { "epoch": 0.4, "learning_rate": 3.4349482355127663e-06, "loss": 1.1023, "step": 13167 }, { "epoch": 0.4, "learning_rate": 3.434722010572239e-06, "loss": 1.2612, "step": 13168 }, { "epoch": 0.4, "learning_rate": 3.4344957767336083e-06, "loss": 1.2133, "step": 13169 }, { "epoch": 0.4, "learning_rate": 3.434269533999029e-06, "loss": 1.0122, "step": 13170 }, { "epoch": 0.4, "learning_rate": 3.4340432823706525e-06, "loss": 1.1226, "step": 13171 }, { "epoch": 0.4, "learning_rate": 3.4338170218506344e-06, "loss": 1.1879, "step": 13172 }, { "epoch": 0.4, "learning_rate": 3.4335907524411275e-06, "loss": 1.1154, "step": 13173 }, { "epoch": 0.4, "learning_rate": 3.4333644741442867e-06, "loss": 1.1706, "step": 13174 }, { "epoch": 0.4, "learning_rate": 3.4331381869622655e-06, "loss": 1.2142, "step": 13175 }, { "epoch": 0.4, "learning_rate": 3.4329118908972187e-06, "loss": 1.2493, "step": 13176 }, { "epoch": 0.4, "learning_rate": 3.432685585951299e-06, "loss": 1.0624, "step": 13177 }, { "epoch": 0.4, "learning_rate": 3.4324592721266626e-06, "loss": 1.0806, "step": 13178 }, { "epoch": 0.4, "learning_rate": 3.4322329494254625e-06, "loss": 1.09, "step": 13179 }, { "epoch": 0.4, "learning_rate": 3.4320066178498545e-06, "loss": 1.1607, "step": 13180 }, { "epoch": 0.4, "learning_rate": 3.4317802774019915e-06, "loss": 1.0251, "step": 13181 }, { "epoch": 0.4, "learning_rate": 3.431553928084029e-06, "loss": 1.1533, "step": 13182 }, { "epoch": 0.4, "learning_rate": 3.4313275698981226e-06, "loss": 1.1762, "step": 13183 }, { "epoch": 0.4, "learning_rate": 3.431101202846425e-06, "loss": 1.1212, "step": 13184 }, { "epoch": 0.4, "learning_rate": 3.4308748269310938e-06, "loss": 1.0188, "step": 13185 }, { "epoch": 0.4, "learning_rate": 3.430648442154282e-06, "loss": 1.2032, "step": 13186 }, { "epoch": 0.4, "learning_rate": 3.4304220485181446e-06, "loss": 1.1606, "step": 13187 }, { "epoch": 0.4, "learning_rate": 3.4301956460248374e-06, "loss": 1.0953, "step": 13188 }, { "epoch": 0.4, "learning_rate": 3.429969234676517e-06, "loss": 1.0743, "step": 13189 }, { "epoch": 0.4, "learning_rate": 3.4297428144753363e-06, "loss": 1.1816, "step": 13190 }, { "epoch": 0.4, "learning_rate": 3.429516385423452e-06, "loss": 1.2112, "step": 13191 }, { "epoch": 0.4, "learning_rate": 3.429289947523019e-06, "loss": 1.0394, "step": 13192 }, { "epoch": 0.4, "learning_rate": 3.429063500776194e-06, "loss": 1.2973, "step": 13193 }, { "epoch": 0.4, "learning_rate": 3.4288370451851315e-06, "loss": 1.1227, "step": 13194 }, { "epoch": 0.4, "learning_rate": 3.428610580751988e-06, "loss": 1.0471, "step": 13195 }, { "epoch": 0.4, "learning_rate": 3.428384107478919e-06, "loss": 1.2012, "step": 13196 }, { "epoch": 0.4, "learning_rate": 3.42815762536808e-06, "loss": 1.1338, "step": 13197 }, { "epoch": 0.4, "learning_rate": 3.4279311344216275e-06, "loss": 1.165, "step": 13198 }, { "epoch": 0.4, "learning_rate": 3.4277046346417176e-06, "loss": 1.0981, "step": 13199 }, { "epoch": 0.4, "learning_rate": 3.4274781260305066e-06, "loss": 1.1855, "step": 13200 }, { "epoch": 0.4, "learning_rate": 3.4272516085901503e-06, "loss": 1.0825, "step": 13201 }, { "epoch": 0.4, "learning_rate": 3.4270250823228052e-06, "loss": 1.1985, "step": 13202 }, { "epoch": 0.4, "learning_rate": 3.4267985472306275e-06, "loss": 1.038, "step": 13203 }, { "epoch": 0.4, "learning_rate": 3.4265720033157744e-06, "loss": 1.266, "step": 13204 }, { "epoch": 0.4, "learning_rate": 3.4263454505804023e-06, "loss": 1.1946, "step": 13205 }, { "epoch": 0.4, "learning_rate": 3.426118889026668e-06, "loss": 1.0734, "step": 13206 }, { "epoch": 0.4, "learning_rate": 3.4258923186567266e-06, "loss": 1.1881, "step": 13207 }, { "epoch": 0.4, "learning_rate": 3.4256657394727376e-06, "loss": 1.1572, "step": 13208 }, { "epoch": 0.4, "learning_rate": 3.425439151476856e-06, "loss": 1.186, "step": 13209 }, { "epoch": 0.4, "learning_rate": 3.4252125546712387e-06, "loss": 1.1165, "step": 13210 }, { "epoch": 0.4, "learning_rate": 3.4249859490580446e-06, "loss": 1.2418, "step": 13211 }, { "epoch": 0.4, "learning_rate": 3.4247593346394293e-06, "loss": 1.1401, "step": 13212 }, { "epoch": 0.4, "learning_rate": 3.424532711417551e-06, "loss": 1.173, "step": 13213 }, { "epoch": 0.4, "learning_rate": 3.4243060793945654e-06, "loss": 1.2389, "step": 13214 }, { "epoch": 0.4, "learning_rate": 3.4240794385726317e-06, "loss": 1.1887, "step": 13215 }, { "epoch": 0.4, "learning_rate": 3.4238527889539063e-06, "loss": 1.1698, "step": 13216 }, { "epoch": 0.4, "learning_rate": 3.4236261305405483e-06, "loss": 1.2107, "step": 13217 }, { "epoch": 0.4, "learning_rate": 3.4233994633347135e-06, "loss": 1.2339, "step": 13218 }, { "epoch": 0.4, "learning_rate": 3.4231727873385614e-06, "loss": 1.1454, "step": 13219 }, { "epoch": 0.4, "learning_rate": 3.422946102554248e-06, "loss": 1.1583, "step": 13220 }, { "epoch": 0.4, "learning_rate": 3.4227194089839333e-06, "loss": 1.1323, "step": 13221 }, { "epoch": 0.4, "learning_rate": 3.422492706629773e-06, "loss": 1.0919, "step": 13222 }, { "epoch": 0.4, "learning_rate": 3.4222659954939276e-06, "loss": 1.1846, "step": 13223 }, { "epoch": 0.4, "learning_rate": 3.4220392755785534e-06, "loss": 1.2834, "step": 13224 }, { "epoch": 0.4, "learning_rate": 3.4218125468858093e-06, "loss": 1.0615, "step": 13225 }, { "epoch": 0.4, "learning_rate": 3.4215858094178546e-06, "loss": 1.1252, "step": 13226 }, { "epoch": 0.4, "learning_rate": 3.4213590631768455e-06, "loss": 1.0986, "step": 13227 }, { "epoch": 0.4, "learning_rate": 3.4211323081649428e-06, "loss": 1.1603, "step": 13228 }, { "epoch": 0.4, "learning_rate": 3.420905544384303e-06, "loss": 0.9957, "step": 13229 }, { "epoch": 0.4, "learning_rate": 3.420678771837088e-06, "loss": 1.3405, "step": 13230 }, { "epoch": 0.4, "learning_rate": 3.420451990525453e-06, "loss": 1.1025, "step": 13231 }, { "epoch": 0.4, "learning_rate": 3.4202252004515586e-06, "loss": 1.0943, "step": 13232 }, { "epoch": 0.4, "learning_rate": 3.4199984016175636e-06, "loss": 1.157, "step": 13233 }, { "epoch": 0.4, "learning_rate": 3.419771594025627e-06, "loss": 1.1241, "step": 13234 }, { "epoch": 0.4, "learning_rate": 3.4195447776779077e-06, "loss": 1.0722, "step": 13235 }, { "epoch": 0.4, "learning_rate": 3.4193179525765647e-06, "loss": 1.1823, "step": 13236 }, { "epoch": 0.4, "learning_rate": 3.419091118723758e-06, "loss": 1.2811, "step": 13237 }, { "epoch": 0.4, "learning_rate": 3.4188642761216462e-06, "loss": 1.1704, "step": 13238 }, { "epoch": 0.4, "learning_rate": 3.41863742477239e-06, "loss": 1.1491, "step": 13239 }, { "epoch": 0.4, "learning_rate": 3.4184105646781464e-06, "loss": 1.1528, "step": 13240 }, { "epoch": 0.4, "learning_rate": 3.4181836958410774e-06, "loss": 1.031, "step": 13241 }, { "epoch": 0.4, "learning_rate": 3.4179568182633417e-06, "loss": 1.1808, "step": 13242 }, { "epoch": 0.4, "learning_rate": 3.417729931947099e-06, "loss": 1.0583, "step": 13243 }, { "epoch": 0.4, "learning_rate": 3.4175030368945095e-06, "loss": 1.1576, "step": 13244 }, { "epoch": 0.4, "learning_rate": 3.4172761331077333e-06, "loss": 1.1506, "step": 13245 }, { "epoch": 0.4, "learning_rate": 3.4170492205889296e-06, "loss": 1.0964, "step": 13246 }, { "epoch": 0.4, "learning_rate": 3.416822299340259e-06, "loss": 1.168, "step": 13247 }, { "epoch": 0.4, "learning_rate": 3.416595369363882e-06, "loss": 1.144, "step": 13248 }, { "epoch": 0.4, "learning_rate": 3.4163684306619576e-06, "loss": 1.1993, "step": 13249 }, { "epoch": 0.4, "learning_rate": 3.4161414832366483e-06, "loss": 1.078, "step": 13250 }, { "epoch": 0.4, "learning_rate": 3.415914527090113e-06, "loss": 1.1087, "step": 13251 }, { "epoch": 0.4, "learning_rate": 3.415687562224512e-06, "loss": 1.0286, "step": 13252 }, { "epoch": 0.4, "learning_rate": 3.415460588642007e-06, "loss": 1.1291, "step": 13253 }, { "epoch": 0.4, "learning_rate": 3.415233606344758e-06, "loss": 1.1265, "step": 13254 }, { "epoch": 0.4, "learning_rate": 3.415006615334926e-06, "loss": 1.1765, "step": 13255 }, { "epoch": 0.4, "learning_rate": 3.414779615614671e-06, "loss": 1.1163, "step": 13256 }, { "epoch": 0.4, "learning_rate": 3.4145526071861546e-06, "loss": 1.0082, "step": 13257 }, { "epoch": 0.4, "learning_rate": 3.414325590051539e-06, "loss": 1.1179, "step": 13258 }, { "epoch": 0.4, "learning_rate": 3.414098564212983e-06, "loss": 1.0811, "step": 13259 }, { "epoch": 0.4, "learning_rate": 3.41387152967265e-06, "loss": 1.0844, "step": 13260 }, { "epoch": 0.4, "learning_rate": 3.4136444864326988e-06, "loss": 1.2817, "step": 13261 }, { "epoch": 0.4, "learning_rate": 3.413417434495293e-06, "loss": 1.1396, "step": 13262 }, { "epoch": 0.4, "learning_rate": 3.4131903738625933e-06, "loss": 1.145, "step": 13263 }, { "epoch": 0.4, "learning_rate": 3.4129633045367606e-06, "loss": 1.1012, "step": 13264 }, { "epoch": 0.4, "learning_rate": 3.412736226519957e-06, "loss": 1.0554, "step": 13265 }, { "epoch": 0.4, "learning_rate": 3.4125091398143444e-06, "loss": 1.209, "step": 13266 }, { "epoch": 0.4, "learning_rate": 3.4122820444220846e-06, "loss": 1.1269, "step": 13267 }, { "epoch": 0.4, "learning_rate": 3.412054940345338e-06, "loss": 1.0817, "step": 13268 }, { "epoch": 0.4, "learning_rate": 3.4118278275862683e-06, "loss": 1.0325, "step": 13269 }, { "epoch": 0.4, "learning_rate": 3.4116007061470363e-06, "loss": 1.0875, "step": 13270 }, { "epoch": 0.4, "learning_rate": 3.4113735760298057e-06, "loss": 1.1835, "step": 13271 }, { "epoch": 0.4, "learning_rate": 3.4111464372367364e-06, "loss": 1.1092, "step": 13272 }, { "epoch": 0.4, "learning_rate": 3.4109192897699926e-06, "loss": 1.14, "step": 13273 }, { "epoch": 0.4, "learning_rate": 3.4106921336317358e-06, "loss": 1.2495, "step": 13274 }, { "epoch": 0.4, "learning_rate": 3.410464968824128e-06, "loss": 1.0733, "step": 13275 }, { "epoch": 0.4, "learning_rate": 3.4102377953493324e-06, "loss": 1.0828, "step": 13276 }, { "epoch": 0.4, "learning_rate": 3.4100106132095117e-06, "loss": 1.0531, "step": 13277 }, { "epoch": 0.4, "learning_rate": 3.4097834224068284e-06, "loss": 1.1855, "step": 13278 }, { "epoch": 0.4, "learning_rate": 3.409556222943444e-06, "loss": 1.2194, "step": 13279 }, { "epoch": 0.4, "learning_rate": 3.4093290148215243e-06, "loss": 1.2396, "step": 13280 }, { "epoch": 0.4, "learning_rate": 3.4091017980432284e-06, "loss": 1.1202, "step": 13281 }, { "epoch": 0.4, "learning_rate": 3.4088745726107224e-06, "loss": 0.9875, "step": 13282 }, { "epoch": 0.4, "learning_rate": 3.4086473385261674e-06, "loss": 1.0741, "step": 13283 }, { "epoch": 0.4, "learning_rate": 3.408420095791728e-06, "loss": 1.1942, "step": 13284 }, { "epoch": 0.4, "learning_rate": 3.4081928444095664e-06, "loss": 1.138, "step": 13285 }, { "epoch": 0.4, "learning_rate": 3.4079655843818466e-06, "loss": 1.2538, "step": 13286 }, { "epoch": 0.4, "learning_rate": 3.407738315710731e-06, "loss": 1.0142, "step": 13287 }, { "epoch": 0.4, "learning_rate": 3.407511038398385e-06, "loss": 1.1654, "step": 13288 }, { "epoch": 0.4, "learning_rate": 3.4072837524469703e-06, "loss": 1.0969, "step": 13289 }, { "epoch": 0.4, "learning_rate": 3.407056457858651e-06, "loss": 1.162, "step": 13290 }, { "epoch": 0.4, "learning_rate": 3.4068291546355917e-06, "loss": 1.1261, "step": 13291 }, { "epoch": 0.4, "learning_rate": 3.4066018427799554e-06, "loss": 1.2355, "step": 13292 }, { "epoch": 0.4, "learning_rate": 3.4063745222939067e-06, "loss": 1.1506, "step": 13293 }, { "epoch": 0.4, "learning_rate": 3.406147193179608e-06, "loss": 1.1123, "step": 13294 }, { "epoch": 0.4, "learning_rate": 3.405919855439225e-06, "loss": 1.1639, "step": 13295 }, { "epoch": 0.4, "learning_rate": 3.4056925090749214e-06, "loss": 1.1317, "step": 13296 }, { "epoch": 0.4, "learning_rate": 3.4054651540888604e-06, "loss": 1.2368, "step": 13297 }, { "epoch": 0.4, "learning_rate": 3.405237790483208e-06, "loss": 1.2747, "step": 13298 }, { "epoch": 0.4, "learning_rate": 3.405010418260128e-06, "loss": 1.1825, "step": 13299 }, { "epoch": 0.4, "learning_rate": 3.4047830374217845e-06, "loss": 1.1375, "step": 13300 }, { "epoch": 0.4, "learning_rate": 3.4045556479703424e-06, "loss": 1.1425, "step": 13301 }, { "epoch": 0.4, "learning_rate": 3.4043282499079656e-06, "loss": 1.0815, "step": 13302 }, { "epoch": 0.4, "learning_rate": 3.4041008432368193e-06, "loss": 1.0814, "step": 13303 }, { "epoch": 0.4, "learning_rate": 3.4038734279590696e-06, "loss": 1.1367, "step": 13304 }, { "epoch": 0.4, "learning_rate": 3.403646004076879e-06, "loss": 1.0855, "step": 13305 }, { "epoch": 0.4, "learning_rate": 3.4034185715924144e-06, "loss": 1.19, "step": 13306 }, { "epoch": 0.4, "learning_rate": 3.4031911305078395e-06, "loss": 0.9985, "step": 13307 }, { "epoch": 0.4, "learning_rate": 3.4029636808253208e-06, "loss": 1.1305, "step": 13308 }, { "epoch": 0.4, "learning_rate": 3.402736222547022e-06, "loss": 1.1645, "step": 13309 }, { "epoch": 0.4, "learning_rate": 3.402508755675109e-06, "loss": 1.1346, "step": 13310 }, { "epoch": 0.4, "learning_rate": 3.402281280211748e-06, "loss": 1.1606, "step": 13311 }, { "epoch": 0.4, "learning_rate": 3.402053796159104e-06, "loss": 1.2241, "step": 13312 }, { "epoch": 0.4, "learning_rate": 3.401826303519341e-06, "loss": 1.084, "step": 13313 }, { "epoch": 0.4, "learning_rate": 3.401598802294627e-06, "loss": 1.1565, "step": 13314 }, { "epoch": 0.4, "learning_rate": 3.4013712924871263e-06, "loss": 1.0405, "step": 13315 }, { "epoch": 0.4, "learning_rate": 3.401143774099005e-06, "loss": 1.0034, "step": 13316 }, { "epoch": 0.4, "learning_rate": 3.400916247132429e-06, "loss": 1.1282, "step": 13317 }, { "epoch": 0.4, "learning_rate": 3.4006887115895643e-06, "loss": 1.0906, "step": 13318 }, { "epoch": 0.4, "learning_rate": 3.4004611674725768e-06, "loss": 1.0854, "step": 13319 }, { "epoch": 0.4, "learning_rate": 3.4002336147836324e-06, "loss": 1.0949, "step": 13320 }, { "epoch": 0.4, "learning_rate": 3.400006053524898e-06, "loss": 1.1213, "step": 13321 }, { "epoch": 0.4, "learning_rate": 3.399778483698539e-06, "loss": 1.0303, "step": 13322 }, { "epoch": 0.4, "learning_rate": 3.3995509053067226e-06, "loss": 1.1136, "step": 13323 }, { "epoch": 0.4, "learning_rate": 3.399323318351615e-06, "loss": 1.1439, "step": 13324 }, { "epoch": 0.4, "learning_rate": 3.3990957228353817e-06, "loss": 1.0303, "step": 13325 }, { "epoch": 0.4, "learning_rate": 3.398868118760191e-06, "loss": 1.0635, "step": 13326 }, { "epoch": 0.4, "learning_rate": 3.398640506128208e-06, "loss": 1.0492, "step": 13327 }, { "epoch": 0.4, "learning_rate": 3.3984128849416005e-06, "loss": 1.1901, "step": 13328 }, { "epoch": 0.4, "learning_rate": 3.3981852552025352e-06, "loss": 1.2225, "step": 13329 }, { "epoch": 0.4, "learning_rate": 3.397957616913179e-06, "loss": 1.0745, "step": 13330 }, { "epoch": 0.4, "learning_rate": 3.397729970075698e-06, "loss": 1.1536, "step": 13331 }, { "epoch": 0.4, "learning_rate": 3.3975023146922608e-06, "loss": 1.1691, "step": 13332 }, { "epoch": 0.4, "learning_rate": 3.397274650765033e-06, "loss": 1.2017, "step": 13333 }, { "epoch": 0.4, "learning_rate": 3.3970469782961835e-06, "loss": 1.0998, "step": 13334 }, { "epoch": 0.4, "learning_rate": 3.3968192972878784e-06, "loss": 1.1387, "step": 13335 }, { "epoch": 0.4, "learning_rate": 3.3965916077422863e-06, "loss": 1.3058, "step": 13336 }, { "epoch": 0.4, "learning_rate": 3.396363909661573e-06, "loss": 1.1462, "step": 13337 }, { "epoch": 0.4, "learning_rate": 3.3961362030479066e-06, "loss": 1.1739, "step": 13338 }, { "epoch": 0.4, "learning_rate": 3.3959084879034554e-06, "loss": 1.0863, "step": 13339 }, { "epoch": 0.4, "learning_rate": 3.395680764230388e-06, "loss": 1.1124, "step": 13340 }, { "epoch": 0.4, "learning_rate": 3.39545303203087e-06, "loss": 1.1901, "step": 13341 }, { "epoch": 0.4, "learning_rate": 3.3952252913070703e-06, "loss": 1.2205, "step": 13342 }, { "epoch": 0.4, "learning_rate": 3.3949975420611573e-06, "loss": 1.2812, "step": 13343 }, { "epoch": 0.4, "learning_rate": 3.3947697842952987e-06, "loss": 1.1754, "step": 13344 }, { "epoch": 0.4, "learning_rate": 3.3945420180116632e-06, "loss": 1.0326, "step": 13345 }, { "epoch": 0.4, "learning_rate": 3.394314243212418e-06, "loss": 1.0891, "step": 13346 }, { "epoch": 0.4, "learning_rate": 3.3940864598997323e-06, "loss": 1.1075, "step": 13347 }, { "epoch": 0.4, "learning_rate": 3.393858668075774e-06, "loss": 1.0717, "step": 13348 }, { "epoch": 0.4, "learning_rate": 3.3936308677427122e-06, "loss": 1.2943, "step": 13349 }, { "epoch": 0.4, "learning_rate": 3.3934030589027134e-06, "loss": 1.0706, "step": 13350 }, { "epoch": 0.4, "learning_rate": 3.393175241557949e-06, "loss": 1.1583, "step": 13351 }, { "epoch": 0.4, "learning_rate": 3.3929474157105856e-06, "loss": 1.0883, "step": 13352 }, { "epoch": 0.4, "learning_rate": 3.3927195813627934e-06, "loss": 1.1519, "step": 13353 }, { "epoch": 0.4, "learning_rate": 3.3924917385167405e-06, "loss": 1.1126, "step": 13354 }, { "epoch": 0.4, "learning_rate": 3.392263887174596e-06, "loss": 1.1887, "step": 13355 }, { "epoch": 0.4, "learning_rate": 3.39203602733853e-06, "loss": 1.1735, "step": 13356 }, { "epoch": 0.4, "learning_rate": 3.39180815901071e-06, "loss": 1.0269, "step": 13357 }, { "epoch": 0.4, "learning_rate": 3.3915802821933057e-06, "loss": 1.1639, "step": 13358 }, { "epoch": 0.4, "learning_rate": 3.3913523968884867e-06, "loss": 1.1789, "step": 13359 }, { "epoch": 0.4, "learning_rate": 3.391124503098422e-06, "loss": 1.1574, "step": 13360 }, { "epoch": 0.4, "learning_rate": 3.3908966008252807e-06, "loss": 1.2255, "step": 13361 }, { "epoch": 0.4, "learning_rate": 3.390668690071234e-06, "loss": 1.1923, "step": 13362 }, { "epoch": 0.4, "learning_rate": 3.3904407708384496e-06, "loss": 1.1597, "step": 13363 }, { "epoch": 0.4, "learning_rate": 3.3902128431290983e-06, "loss": 1.2268, "step": 13364 }, { "epoch": 0.4, "learning_rate": 3.3899849069453496e-06, "loss": 1.0294, "step": 13365 }, { "epoch": 0.4, "learning_rate": 3.3897569622893724e-06, "loss": 1.0811, "step": 13366 }, { "epoch": 0.4, "learning_rate": 3.3895290091633376e-06, "loss": 1.0883, "step": 13367 }, { "epoch": 0.4, "learning_rate": 3.389301047569415e-06, "loss": 1.1575, "step": 13368 }, { "epoch": 0.4, "learning_rate": 3.3890730775097753e-06, "loss": 1.212, "step": 13369 }, { "epoch": 0.4, "learning_rate": 3.3888450989865875e-06, "loss": 1.044, "step": 13370 }, { "epoch": 0.4, "learning_rate": 3.3886171120020234e-06, "loss": 1.1609, "step": 13371 }, { "epoch": 0.4, "learning_rate": 3.388389116558252e-06, "loss": 1.0839, "step": 13372 }, { "epoch": 0.4, "learning_rate": 3.3881611126574432e-06, "loss": 1.2251, "step": 13373 }, { "epoch": 0.4, "learning_rate": 3.387933100301769e-06, "loss": 1.1084, "step": 13374 }, { "epoch": 0.4, "learning_rate": 3.3877050794933997e-06, "loss": 1.2268, "step": 13375 }, { "epoch": 0.4, "learning_rate": 3.387477050234505e-06, "loss": 1.1581, "step": 13376 }, { "epoch": 0.4, "learning_rate": 3.3872490125272567e-06, "loss": 1.2279, "step": 13377 }, { "epoch": 0.4, "learning_rate": 3.3870209663738244e-06, "loss": 1.0444, "step": 13378 }, { "epoch": 0.4, "learning_rate": 3.38679291177638e-06, "loss": 1.1555, "step": 13379 }, { "epoch": 0.4, "learning_rate": 3.386564848737094e-06, "loss": 1.0876, "step": 13380 }, { "epoch": 0.4, "learning_rate": 3.3863367772581384e-06, "loss": 1.111, "step": 13381 }, { "epoch": 0.4, "learning_rate": 3.386108697341683e-06, "loss": 1.1911, "step": 13382 }, { "epoch": 0.4, "learning_rate": 3.3858806089898995e-06, "loss": 1.1381, "step": 13383 }, { "epoch": 0.4, "learning_rate": 3.3856525122049593e-06, "loss": 1.1522, "step": 13384 }, { "epoch": 0.4, "learning_rate": 3.3854244069890342e-06, "loss": 0.9037, "step": 13385 }, { "epoch": 0.4, "learning_rate": 3.385196293344295e-06, "loss": 1.1574, "step": 13386 }, { "epoch": 0.4, "learning_rate": 3.384968171272913e-06, "loss": 1.1324, "step": 13387 }, { "epoch": 0.4, "learning_rate": 3.3847400407770603e-06, "loss": 1.2072, "step": 13388 }, { "epoch": 0.4, "learning_rate": 3.384511901858909e-06, "loss": 1.1722, "step": 13389 }, { "epoch": 0.4, "learning_rate": 3.3842837545206297e-06, "loss": 1.0923, "step": 13390 }, { "epoch": 0.4, "learning_rate": 3.384055598764395e-06, "loss": 1.071, "step": 13391 }, { "epoch": 0.4, "learning_rate": 3.383827434592377e-06, "loss": 1.2811, "step": 13392 }, { "epoch": 0.4, "learning_rate": 3.3835992620067476e-06, "loss": 1.1524, "step": 13393 }, { "epoch": 0.4, "learning_rate": 3.3833710810096787e-06, "loss": 1.1885, "step": 13394 }, { "epoch": 0.4, "learning_rate": 3.3831428916033425e-06, "loss": 1.0879, "step": 13395 }, { "epoch": 0.4, "learning_rate": 3.3829146937899117e-06, "loss": 1.1008, "step": 13396 }, { "epoch": 0.4, "learning_rate": 3.382686487571558e-06, "loss": 1.1545, "step": 13397 }, { "epoch": 0.4, "learning_rate": 3.382458272950454e-06, "loss": 1.046, "step": 13398 }, { "epoch": 0.4, "learning_rate": 3.3822300499287725e-06, "loss": 1.1893, "step": 13399 }, { "epoch": 0.4, "learning_rate": 3.3820018185086852e-06, "loss": 1.079, "step": 13400 }, { "epoch": 0.4, "learning_rate": 3.381773578692366e-06, "loss": 1.142, "step": 13401 }, { "epoch": 0.4, "learning_rate": 3.3815453304819868e-06, "loss": 1.1209, "step": 13402 }, { "epoch": 0.4, "learning_rate": 3.381317073879721e-06, "loss": 1.0624, "step": 13403 }, { "epoch": 0.4, "learning_rate": 3.3810888088877403e-06, "loss": 1.2266, "step": 13404 }, { "epoch": 0.4, "learning_rate": 3.3808605355082187e-06, "loss": 1.0762, "step": 13405 }, { "epoch": 0.4, "learning_rate": 3.380632253743329e-06, "loss": 1.1876, "step": 13406 }, { "epoch": 0.4, "learning_rate": 3.3804039635952447e-06, "loss": 1.2363, "step": 13407 }, { "epoch": 0.4, "learning_rate": 3.3801756650661384e-06, "loss": 1.1154, "step": 13408 }, { "epoch": 0.4, "learning_rate": 3.379947358158183e-06, "loss": 1.0851, "step": 13409 }, { "epoch": 0.4, "learning_rate": 3.3797190428735542e-06, "loss": 1.2532, "step": 13410 }, { "epoch": 0.4, "learning_rate": 3.379490719214423e-06, "loss": 1.2546, "step": 13411 }, { "epoch": 0.4, "learning_rate": 3.379262387182964e-06, "loss": 1.2504, "step": 13412 }, { "epoch": 0.4, "learning_rate": 3.37903404678135e-06, "loss": 1.2216, "step": 13413 }, { "epoch": 0.4, "learning_rate": 3.3788056980117554e-06, "loss": 1.2076, "step": 13414 }, { "epoch": 0.4, "learning_rate": 3.378577340876354e-06, "loss": 1.2679, "step": 13415 }, { "epoch": 0.4, "learning_rate": 3.3783489753773195e-06, "loss": 1.0724, "step": 13416 }, { "epoch": 0.4, "learning_rate": 3.3781206015168256e-06, "loss": 1.1436, "step": 13417 }, { "epoch": 0.4, "learning_rate": 3.3778922192970465e-06, "loss": 1.1007, "step": 13418 }, { "epoch": 0.4, "learning_rate": 3.3776638287201562e-06, "loss": 1.1931, "step": 13419 }, { "epoch": 0.4, "learning_rate": 3.3774354297883286e-06, "loss": 1.1165, "step": 13420 }, { "epoch": 0.4, "learning_rate": 3.377207022503739e-06, "loss": 1.1268, "step": 13421 }, { "epoch": 0.4, "learning_rate": 3.3769786068685604e-06, "loss": 1.0305, "step": 13422 }, { "epoch": 0.4, "learning_rate": 3.3767501828849685e-06, "loss": 1.1814, "step": 13423 }, { "epoch": 0.4, "learning_rate": 3.3765217505551366e-06, "loss": 1.1679, "step": 13424 }, { "epoch": 0.4, "learning_rate": 3.37629330988124e-06, "loss": 1.1333, "step": 13425 }, { "epoch": 0.4, "learning_rate": 3.3760648608654535e-06, "loss": 1.2, "step": 13426 }, { "epoch": 0.4, "learning_rate": 3.375836403509951e-06, "loss": 1.122, "step": 13427 }, { "epoch": 0.4, "learning_rate": 3.3756079378169076e-06, "loss": 1.1411, "step": 13428 }, { "epoch": 0.4, "learning_rate": 3.375379463788499e-06, "loss": 0.9943, "step": 13429 }, { "epoch": 0.4, "learning_rate": 3.375150981426899e-06, "loss": 1.1017, "step": 13430 }, { "epoch": 0.4, "learning_rate": 3.3749224907342837e-06, "loss": 1.1968, "step": 13431 }, { "epoch": 0.4, "learning_rate": 3.3746939917128265e-06, "loss": 1.0461, "step": 13432 }, { "epoch": 0.4, "learning_rate": 3.3744654843647042e-06, "loss": 1.1428, "step": 13433 }, { "epoch": 0.4, "learning_rate": 3.3742369686920916e-06, "loss": 1.1072, "step": 13434 }, { "epoch": 0.4, "learning_rate": 3.3740084446971644e-06, "loss": 1.2136, "step": 13435 }, { "epoch": 0.4, "learning_rate": 3.373779912382098e-06, "loss": 1.1401, "step": 13436 }, { "epoch": 0.4, "learning_rate": 3.3735513717490677e-06, "loss": 1.1107, "step": 13437 }, { "epoch": 0.4, "learning_rate": 3.3733228228002483e-06, "loss": 1.093, "step": 13438 }, { "epoch": 0.4, "learning_rate": 3.373094265537817e-06, "loss": 1.1361, "step": 13439 }, { "epoch": 0.4, "learning_rate": 3.3728656999639486e-06, "loss": 1.1077, "step": 13440 }, { "epoch": 0.4, "learning_rate": 3.3726371260808187e-06, "loss": 1.2507, "step": 13441 }, { "epoch": 0.4, "learning_rate": 3.372408543890604e-06, "loss": 1.0823, "step": 13442 }, { "epoch": 0.4, "learning_rate": 3.3721799533954802e-06, "loss": 1.1115, "step": 13443 }, { "epoch": 0.41, "learning_rate": 3.3719513545976233e-06, "loss": 1.0919, "step": 13444 }, { "epoch": 0.41, "learning_rate": 3.3717227474992093e-06, "loss": 1.1293, "step": 13445 }, { "epoch": 0.41, "learning_rate": 3.371494132102414e-06, "loss": 1.1711, "step": 13446 }, { "epoch": 0.41, "learning_rate": 3.3712655084094155e-06, "loss": 1.0965, "step": 13447 }, { "epoch": 0.41, "learning_rate": 3.371036876422388e-06, "loss": 1.1512, "step": 13448 }, { "epoch": 0.41, "learning_rate": 3.370808236143509e-06, "loss": 1.2038, "step": 13449 }, { "epoch": 0.41, "learning_rate": 3.370579587574955e-06, "loss": 1.1855, "step": 13450 }, { "epoch": 0.41, "learning_rate": 3.3703509307189036e-06, "loss": 1.1822, "step": 13451 }, { "epoch": 0.41, "learning_rate": 3.3701222655775294e-06, "loss": 1.1879, "step": 13452 }, { "epoch": 0.41, "learning_rate": 3.369893592153011e-06, "loss": 1.2003, "step": 13453 }, { "epoch": 0.41, "learning_rate": 3.3696649104475244e-06, "loss": 1.0402, "step": 13454 }, { "epoch": 0.41, "learning_rate": 3.369436220463247e-06, "loss": 1.167, "step": 13455 }, { "epoch": 0.41, "learning_rate": 3.3692075222023547e-06, "loss": 1.1839, "step": 13456 }, { "epoch": 0.41, "learning_rate": 3.368978815667026e-06, "loss": 1.0717, "step": 13457 }, { "epoch": 0.41, "learning_rate": 3.368750100859437e-06, "loss": 1.114, "step": 13458 }, { "epoch": 0.41, "learning_rate": 3.368521377781766e-06, "loss": 1.1646, "step": 13459 }, { "epoch": 0.41, "learning_rate": 3.368292646436189e-06, "loss": 1.2875, "step": 13460 }, { "epoch": 0.41, "learning_rate": 3.368063906824885e-06, "loss": 1.2069, "step": 13461 }, { "epoch": 0.41, "learning_rate": 3.36783515895003e-06, "loss": 1.2393, "step": 13462 }, { "epoch": 0.41, "learning_rate": 3.367606402813802e-06, "loss": 1.1746, "step": 13463 }, { "epoch": 0.41, "learning_rate": 3.36737763841838e-06, "loss": 1.0947, "step": 13464 }, { "epoch": 0.41, "learning_rate": 3.36714886576594e-06, "loss": 1.1276, "step": 13465 }, { "epoch": 0.41, "learning_rate": 3.3669200848586613e-06, "loss": 1.1703, "step": 13466 }, { "epoch": 0.41, "learning_rate": 3.3666912956987198e-06, "loss": 1.2055, "step": 13467 }, { "epoch": 0.41, "learning_rate": 3.3664624982882953e-06, "loss": 1.2019, "step": 13468 }, { "epoch": 0.41, "learning_rate": 3.3662336926295647e-06, "loss": 1.1453, "step": 13469 }, { "epoch": 0.41, "learning_rate": 3.3660048787247067e-06, "loss": 1.1703, "step": 13470 }, { "epoch": 0.41, "learning_rate": 3.365776056575899e-06, "loss": 1.1131, "step": 13471 }, { "epoch": 0.41, "learning_rate": 3.3655472261853213e-06, "loss": 1.0697, "step": 13472 }, { "epoch": 0.41, "learning_rate": 3.3653183875551497e-06, "loss": 1.0984, "step": 13473 }, { "epoch": 0.41, "learning_rate": 3.3650895406875637e-06, "loss": 1.114, "step": 13474 }, { "epoch": 0.41, "learning_rate": 3.364860685584742e-06, "loss": 1.1841, "step": 13475 }, { "epoch": 0.41, "learning_rate": 3.3646318222488633e-06, "loss": 1.0691, "step": 13476 }, { "epoch": 0.41, "learning_rate": 3.364402950682107e-06, "loss": 0.996, "step": 13477 }, { "epoch": 0.41, "learning_rate": 3.36417407088665e-06, "loss": 1.0586, "step": 13478 }, { "epoch": 0.41, "learning_rate": 3.3639451828646723e-06, "loss": 1.1009, "step": 13479 }, { "epoch": 0.41, "learning_rate": 3.363716286618352e-06, "loss": 1.2298, "step": 13480 }, { "epoch": 0.41, "learning_rate": 3.3634873821498696e-06, "loss": 1.2118, "step": 13481 }, { "epoch": 0.41, "learning_rate": 3.363258469461402e-06, "loss": 1.01, "step": 13482 }, { "epoch": 0.41, "learning_rate": 3.3630295485551313e-06, "loss": 1.1282, "step": 13483 }, { "epoch": 0.41, "learning_rate": 3.3628006194332337e-06, "loss": 1.1766, "step": 13484 }, { "epoch": 0.41, "learning_rate": 3.3625716820978897e-06, "loss": 1.2213, "step": 13485 }, { "epoch": 0.41, "learning_rate": 3.362342736551279e-06, "loss": 1.1365, "step": 13486 }, { "epoch": 0.41, "learning_rate": 3.36211378279558e-06, "loss": 1.223, "step": 13487 }, { "epoch": 0.41, "learning_rate": 3.3618848208329747e-06, "loss": 1.1477, "step": 13488 }, { "epoch": 0.41, "learning_rate": 3.3616558506656392e-06, "loss": 1.0653, "step": 13489 }, { "epoch": 0.41, "learning_rate": 3.3614268722957553e-06, "loss": 1.1066, "step": 13490 }, { "epoch": 0.41, "learning_rate": 3.3611978857255036e-06, "loss": 1.1211, "step": 13491 }, { "epoch": 0.41, "learning_rate": 3.3609688909570622e-06, "loss": 1.1057, "step": 13492 }, { "epoch": 0.41, "learning_rate": 3.360739887992611e-06, "loss": 1.0656, "step": 13493 }, { "epoch": 0.41, "learning_rate": 3.360510876834332e-06, "loss": 1.1227, "step": 13494 }, { "epoch": 0.41, "learning_rate": 3.3602818574844024e-06, "loss": 1.0872, "step": 13495 }, { "epoch": 0.41, "learning_rate": 3.3600528299450047e-06, "loss": 1.1631, "step": 13496 }, { "epoch": 0.41, "learning_rate": 3.3598237942183182e-06, "loss": 1.0946, "step": 13497 }, { "epoch": 0.41, "learning_rate": 3.3595947503065236e-06, "loss": 0.9503, "step": 13498 }, { "epoch": 0.41, "learning_rate": 3.3593656982118e-06, "loss": 1.02, "step": 13499 }, { "epoch": 0.41, "learning_rate": 3.35913663793633e-06, "loss": 1.1342, "step": 13500 }, { "epoch": 0.41, "learning_rate": 3.3589075694822916e-06, "loss": 1.1108, "step": 13501 }, { "epoch": 0.41, "learning_rate": 3.3586784928518674e-06, "loss": 1.127, "step": 13502 }, { "epoch": 0.41, "learning_rate": 3.3584494080472373e-06, "loss": 1.0761, "step": 13503 }, { "epoch": 0.41, "learning_rate": 3.358220315070583e-06, "loss": 1.0953, "step": 13504 }, { "epoch": 0.41, "learning_rate": 3.3579912139240846e-06, "loss": 1.155, "step": 13505 }, { "epoch": 0.41, "learning_rate": 3.3577621046099218e-06, "loss": 1.0305, "step": 13506 }, { "epoch": 0.41, "learning_rate": 3.3575329871302787e-06, "loss": 1.2662, "step": 13507 }, { "epoch": 0.41, "learning_rate": 3.357303861487333e-06, "loss": 1.0782, "step": 13508 }, { "epoch": 0.41, "learning_rate": 3.3570747276832684e-06, "loss": 1.1178, "step": 13509 }, { "epoch": 0.41, "learning_rate": 3.3568455857202646e-06, "loss": 1.1706, "step": 13510 }, { "epoch": 0.41, "learning_rate": 3.356616435600504e-06, "loss": 1.1923, "step": 13511 }, { "epoch": 0.41, "learning_rate": 3.3563872773261675e-06, "loss": 1.1638, "step": 13512 }, { "epoch": 0.41, "learning_rate": 3.356158110899437e-06, "loss": 1.1497, "step": 13513 }, { "epoch": 0.41, "learning_rate": 3.3559289363224924e-06, "loss": 1.2426, "step": 13514 }, { "epoch": 0.41, "learning_rate": 3.3556997535975167e-06, "loss": 1.1464, "step": 13515 }, { "epoch": 0.41, "learning_rate": 3.3554705627266916e-06, "loss": 1.1197, "step": 13516 }, { "epoch": 0.41, "learning_rate": 3.3552413637121987e-06, "loss": 1.0822, "step": 13517 }, { "epoch": 0.41, "learning_rate": 3.3550121565562204e-06, "loss": 1.2084, "step": 13518 }, { "epoch": 0.41, "learning_rate": 3.3547829412609377e-06, "loss": 1.1492, "step": 13519 }, { "epoch": 0.41, "learning_rate": 3.3545537178285343e-06, "loss": 1.1205, "step": 13520 }, { "epoch": 0.41, "learning_rate": 3.3543244862611897e-06, "loss": 1.059, "step": 13521 }, { "epoch": 0.41, "learning_rate": 3.3540952465610883e-06, "loss": 1.2195, "step": 13522 }, { "epoch": 0.41, "learning_rate": 3.353865998730411e-06, "loss": 1.0473, "step": 13523 }, { "epoch": 0.41, "learning_rate": 3.353636742771341e-06, "loss": 1.1906, "step": 13524 }, { "epoch": 0.41, "learning_rate": 3.353407478686059e-06, "loss": 1.0538, "step": 13525 }, { "epoch": 0.41, "learning_rate": 3.353178206476751e-06, "loss": 1.1283, "step": 13526 }, { "epoch": 0.41, "learning_rate": 3.352948926145596e-06, "loss": 1.2272, "step": 13527 }, { "epoch": 0.41, "learning_rate": 3.352719637694778e-06, "loss": 1.1738, "step": 13528 }, { "epoch": 0.41, "learning_rate": 3.3524903411264803e-06, "loss": 1.1375, "step": 13529 }, { "epoch": 0.41, "learning_rate": 3.352261036442884e-06, "loss": 1.2032, "step": 13530 }, { "epoch": 0.41, "learning_rate": 3.352031723646174e-06, "loss": 1.0922, "step": 13531 }, { "epoch": 0.41, "learning_rate": 3.351802402738532e-06, "loss": 1.0819, "step": 13532 }, { "epoch": 0.41, "learning_rate": 3.351573073722142e-06, "loss": 1.1781, "step": 13533 }, { "epoch": 0.41, "learning_rate": 3.3513437365991863e-06, "loss": 1.159, "step": 13534 }, { "epoch": 0.41, "learning_rate": 3.351114391371848e-06, "loss": 1.1426, "step": 13535 }, { "epoch": 0.41, "learning_rate": 3.3508850380423107e-06, "loss": 1.1613, "step": 13536 }, { "epoch": 0.41, "learning_rate": 3.3506556766127577e-06, "loss": 1.0342, "step": 13537 }, { "epoch": 0.41, "learning_rate": 3.350426307085372e-06, "loss": 1.0474, "step": 13538 }, { "epoch": 0.41, "learning_rate": 3.350196929462338e-06, "loss": 1.101, "step": 13539 }, { "epoch": 0.41, "learning_rate": 3.3499675437458386e-06, "loss": 1.184, "step": 13540 }, { "epoch": 0.41, "learning_rate": 3.3497381499380565e-06, "loss": 1.173, "step": 13541 }, { "epoch": 0.41, "learning_rate": 3.349508748041178e-06, "loss": 1.0352, "step": 13542 }, { "epoch": 0.41, "learning_rate": 3.349279338057384e-06, "loss": 1.2174, "step": 13543 }, { "epoch": 0.41, "learning_rate": 3.3490499199888605e-06, "loss": 1.059, "step": 13544 }, { "epoch": 0.41, "learning_rate": 3.3488204938377907e-06, "loss": 1.1484, "step": 13545 }, { "epoch": 0.41, "learning_rate": 3.3485910596063586e-06, "loss": 1.1479, "step": 13546 }, { "epoch": 0.41, "learning_rate": 3.3483616172967474e-06, "loss": 1.0712, "step": 13547 }, { "epoch": 0.41, "learning_rate": 3.3481321669111434e-06, "loss": 1.1406, "step": 13548 }, { "epoch": 0.41, "learning_rate": 3.347902708451729e-06, "loss": 1.195, "step": 13549 }, { "epoch": 0.41, "learning_rate": 3.3476732419206896e-06, "loss": 1.1292, "step": 13550 }, { "epoch": 0.41, "learning_rate": 3.3474437673202085e-06, "loss": 1.0306, "step": 13551 }, { "epoch": 0.41, "learning_rate": 3.3472142846524725e-06, "loss": 1.145, "step": 13552 }, { "epoch": 0.41, "learning_rate": 3.346984793919663e-06, "loss": 1.1001, "step": 13553 }, { "epoch": 0.41, "learning_rate": 3.3467552951239667e-06, "loss": 1.138, "step": 13554 }, { "epoch": 0.41, "learning_rate": 3.346525788267567e-06, "loss": 1.1459, "step": 13555 }, { "epoch": 0.41, "learning_rate": 3.3462962733526507e-06, "loss": 1.1909, "step": 13556 }, { "epoch": 0.41, "learning_rate": 3.3460667503814e-06, "loss": 1.1926, "step": 13557 }, { "epoch": 0.41, "learning_rate": 3.3458372193560023e-06, "loss": 1.1949, "step": 13558 }, { "epoch": 0.41, "learning_rate": 3.3456076802786418e-06, "loss": 1.1543, "step": 13559 }, { "epoch": 0.41, "learning_rate": 3.3453781331515032e-06, "loss": 1.1672, "step": 13560 }, { "epoch": 0.41, "learning_rate": 3.3451485779767724e-06, "loss": 1.1769, "step": 13561 }, { "epoch": 0.41, "learning_rate": 3.3449190147566334e-06, "loss": 1.1567, "step": 13562 }, { "epoch": 0.41, "learning_rate": 3.344689443493273e-06, "loss": 1.1207, "step": 13563 }, { "epoch": 0.41, "learning_rate": 3.3444598641888752e-06, "loss": 1.0082, "step": 13564 }, { "epoch": 0.41, "learning_rate": 3.344230276845627e-06, "loss": 1.0852, "step": 13565 }, { "epoch": 0.41, "learning_rate": 3.344000681465712e-06, "loss": 1.1243, "step": 13566 }, { "epoch": 0.41, "learning_rate": 3.3437710780513183e-06, "loss": 1.2344, "step": 13567 }, { "epoch": 0.41, "learning_rate": 3.3435414666046296e-06, "loss": 1.2616, "step": 13568 }, { "epoch": 0.41, "learning_rate": 3.3433118471278326e-06, "loss": 1.2651, "step": 13569 }, { "epoch": 0.41, "learning_rate": 3.343082219623113e-06, "loss": 1.1456, "step": 13570 }, { "epoch": 0.41, "learning_rate": 3.3428525840926562e-06, "loss": 1.1747, "step": 13571 }, { "epoch": 0.41, "learning_rate": 3.342622940538649e-06, "loss": 1.1849, "step": 13572 }, { "epoch": 0.41, "learning_rate": 3.342393288963277e-06, "loss": 1.1105, "step": 13573 }, { "epoch": 0.41, "learning_rate": 3.3421636293687275e-06, "loss": 1.2181, "step": 13574 }, { "epoch": 0.41, "learning_rate": 3.341933961757185e-06, "loss": 1.1926, "step": 13575 }, { "epoch": 0.41, "learning_rate": 3.3417042861308376e-06, "loss": 1.095, "step": 13576 }, { "epoch": 0.41, "learning_rate": 3.34147460249187e-06, "loss": 1.1272, "step": 13577 }, { "epoch": 0.41, "learning_rate": 3.3412449108424695e-06, "loss": 1.1195, "step": 13578 }, { "epoch": 0.41, "learning_rate": 3.3410152111848227e-06, "loss": 1.1477, "step": 13579 }, { "epoch": 0.41, "learning_rate": 3.340785503521116e-06, "loss": 1.004, "step": 13580 }, { "epoch": 0.41, "learning_rate": 3.3405557878535365e-06, "loss": 1.2321, "step": 13581 }, { "epoch": 0.41, "learning_rate": 3.3403260641842704e-06, "loss": 1.1039, "step": 13582 }, { "epoch": 0.41, "learning_rate": 3.3400963325155058e-06, "loss": 1.0716, "step": 13583 }, { "epoch": 0.41, "learning_rate": 3.3398665928494274e-06, "loss": 0.9949, "step": 13584 }, { "epoch": 0.41, "learning_rate": 3.3396368451882237e-06, "loss": 1.1141, "step": 13585 }, { "epoch": 0.41, "learning_rate": 3.3394070895340817e-06, "loss": 1.2484, "step": 13586 }, { "epoch": 0.41, "learning_rate": 3.3391773258891897e-06, "loss": 1.2073, "step": 13587 }, { "epoch": 0.41, "learning_rate": 3.3389475542557326e-06, "loss": 1.0826, "step": 13588 }, { "epoch": 0.41, "learning_rate": 3.3387177746358988e-06, "loss": 1.0333, "step": 13589 }, { "epoch": 0.41, "learning_rate": 3.3384879870318764e-06, "loss": 1.1254, "step": 13590 }, { "epoch": 0.41, "learning_rate": 3.3382581914458522e-06, "loss": 0.9973, "step": 13591 }, { "epoch": 0.41, "learning_rate": 3.338028387880013e-06, "loss": 1.2757, "step": 13592 }, { "epoch": 0.41, "learning_rate": 3.3377985763365477e-06, "loss": 1.0663, "step": 13593 }, { "epoch": 0.41, "learning_rate": 3.337568756817643e-06, "loss": 0.9921, "step": 13594 }, { "epoch": 0.41, "learning_rate": 3.337338929325487e-06, "loss": 1.1827, "step": 13595 }, { "epoch": 0.41, "learning_rate": 3.3371090938622686e-06, "loss": 1.1663, "step": 13596 }, { "epoch": 0.41, "learning_rate": 3.336879250430174e-06, "loss": 1.1044, "step": 13597 }, { "epoch": 0.41, "learning_rate": 3.336649399031392e-06, "loss": 1.1277, "step": 13598 }, { "epoch": 0.41, "learning_rate": 3.336419539668111e-06, "loss": 1.1132, "step": 13599 }, { "epoch": 0.41, "learning_rate": 3.336189672342519e-06, "loss": 1.1026, "step": 13600 }, { "epoch": 0.41, "learning_rate": 3.335959797056804e-06, "loss": 1.1508, "step": 13601 }, { "epoch": 0.41, "learning_rate": 3.335729913813154e-06, "loss": 1.197, "step": 13602 }, { "epoch": 0.41, "learning_rate": 3.3355000226137575e-06, "loss": 1.1175, "step": 13603 }, { "epoch": 0.41, "learning_rate": 3.3352701234608035e-06, "loss": 1.164, "step": 13604 }, { "epoch": 0.41, "learning_rate": 3.3350402163564798e-06, "loss": 1.0899, "step": 13605 }, { "epoch": 0.41, "learning_rate": 3.3348103013029763e-06, "loss": 1.1204, "step": 13606 }, { "epoch": 0.41, "learning_rate": 3.33458037830248e-06, "loss": 1.2388, "step": 13607 }, { "epoch": 0.41, "learning_rate": 3.334350447357181e-06, "loss": 1.139, "step": 13608 }, { "epoch": 0.41, "learning_rate": 3.3341205084692675e-06, "loss": 1.1727, "step": 13609 }, { "epoch": 0.41, "learning_rate": 3.3338905616409277e-06, "loss": 1.1639, "step": 13610 }, { "epoch": 0.41, "learning_rate": 3.3336606068743523e-06, "loss": 1.1589, "step": 13611 }, { "epoch": 0.41, "learning_rate": 3.333430644171729e-06, "loss": 1.122, "step": 13612 }, { "epoch": 0.41, "learning_rate": 3.3332006735352472e-06, "loss": 1.1958, "step": 13613 }, { "epoch": 0.41, "learning_rate": 3.3329706949670964e-06, "loss": 1.0426, "step": 13614 }, { "epoch": 0.41, "learning_rate": 3.3327407084694665e-06, "loss": 1.1425, "step": 13615 }, { "epoch": 0.41, "learning_rate": 3.332510714044545e-06, "loss": 1.0942, "step": 13616 }, { "epoch": 0.41, "learning_rate": 3.3322807116945233e-06, "loss": 1.1105, "step": 13617 }, { "epoch": 0.41, "learning_rate": 3.3320507014215895e-06, "loss": 1.1187, "step": 13618 }, { "epoch": 0.41, "learning_rate": 3.3318206832279342e-06, "loss": 1.136, "step": 13619 }, { "epoch": 0.41, "learning_rate": 3.3315906571157465e-06, "loss": 1.0947, "step": 13620 }, { "epoch": 0.41, "learning_rate": 3.331360623087216e-06, "loss": 1.1441, "step": 13621 }, { "epoch": 0.41, "learning_rate": 3.331130581144533e-06, "loss": 1.1425, "step": 13622 }, { "epoch": 0.41, "learning_rate": 3.330900531289887e-06, "loss": 1.2042, "step": 13623 }, { "epoch": 0.41, "learning_rate": 3.3306704735254684e-06, "loss": 1.1824, "step": 13624 }, { "epoch": 0.41, "learning_rate": 3.330440407853467e-06, "loss": 1.0788, "step": 13625 }, { "epoch": 0.41, "learning_rate": 3.3302103342760717e-06, "loss": 1.2662, "step": 13626 }, { "epoch": 0.41, "learning_rate": 3.329980252795475e-06, "loss": 1.1013, "step": 13627 }, { "epoch": 0.41, "learning_rate": 3.3297501634138663e-06, "loss": 1.0694, "step": 13628 }, { "epoch": 0.41, "learning_rate": 3.329520066133435e-06, "loss": 1.1138, "step": 13629 }, { "epoch": 0.41, "learning_rate": 3.3292899609563722e-06, "loss": 0.9988, "step": 13630 }, { "epoch": 0.41, "learning_rate": 3.3290598478848684e-06, "loss": 1.1514, "step": 13631 }, { "epoch": 0.41, "learning_rate": 3.3288297269211147e-06, "loss": 1.1294, "step": 13632 }, { "epoch": 0.41, "learning_rate": 3.3285995980673004e-06, "loss": 1.1084, "step": 13633 }, { "epoch": 0.41, "learning_rate": 3.3283694613256167e-06, "loss": 1.1257, "step": 13634 }, { "epoch": 0.41, "learning_rate": 3.3281393166982557e-06, "loss": 1.1463, "step": 13635 }, { "epoch": 0.41, "learning_rate": 3.3279091641874066e-06, "loss": 1.1675, "step": 13636 }, { "epoch": 0.41, "learning_rate": 3.3276790037952624e-06, "loss": 1.1917, "step": 13637 }, { "epoch": 0.41, "learning_rate": 3.327448835524011e-06, "loss": 1.1004, "step": 13638 }, { "epoch": 0.41, "learning_rate": 3.3272186593758456e-06, "loss": 1.244, "step": 13639 }, { "epoch": 0.41, "learning_rate": 3.326988475352957e-06, "loss": 1.0873, "step": 13640 }, { "epoch": 0.41, "learning_rate": 3.3267582834575363e-06, "loss": 1.1903, "step": 13641 }, { "epoch": 0.41, "learning_rate": 3.3265280836917754e-06, "loss": 1.1769, "step": 13642 }, { "epoch": 0.41, "learning_rate": 3.3262978760578652e-06, "loss": 1.0928, "step": 13643 }, { "epoch": 0.41, "learning_rate": 3.3260676605579967e-06, "loss": 1.1235, "step": 13644 }, { "epoch": 0.41, "learning_rate": 3.3258374371943625e-06, "loss": 1.1172, "step": 13645 }, { "epoch": 0.41, "learning_rate": 3.325607205969153e-06, "loss": 1.0901, "step": 13646 }, { "epoch": 0.41, "learning_rate": 3.325376966884561e-06, "loss": 1.0919, "step": 13647 }, { "epoch": 0.41, "learning_rate": 3.3251467199427772e-06, "loss": 1.2144, "step": 13648 }, { "epoch": 0.41, "learning_rate": 3.3249164651459942e-06, "loss": 1.169, "step": 13649 }, { "epoch": 0.41, "learning_rate": 3.3246862024964043e-06, "loss": 1.271, "step": 13650 }, { "epoch": 0.41, "learning_rate": 3.324455931996199e-06, "loss": 1.1308, "step": 13651 }, { "epoch": 0.41, "learning_rate": 3.324225653647569e-06, "loss": 1.1581, "step": 13652 }, { "epoch": 0.41, "learning_rate": 3.323995367452709e-06, "loss": 1.1112, "step": 13653 }, { "epoch": 0.41, "learning_rate": 3.32376507341381e-06, "loss": 1.1279, "step": 13654 }, { "epoch": 0.41, "learning_rate": 3.3235347715330633e-06, "loss": 1.165, "step": 13655 }, { "epoch": 0.41, "learning_rate": 3.323304461812663e-06, "loss": 1.1489, "step": 13656 }, { "epoch": 0.41, "learning_rate": 3.3230741442548004e-06, "loss": 1.0748, "step": 13657 }, { "epoch": 0.41, "learning_rate": 3.3228438188616685e-06, "loss": 1.1227, "step": 13658 }, { "epoch": 0.41, "learning_rate": 3.3226134856354596e-06, "loss": 1.1476, "step": 13659 }, { "epoch": 0.41, "learning_rate": 3.3223831445783672e-06, "loss": 1.1823, "step": 13660 }, { "epoch": 0.41, "learning_rate": 3.3221527956925825e-06, "loss": 1.1268, "step": 13661 }, { "epoch": 0.41, "learning_rate": 3.321922438980299e-06, "loss": 1.1316, "step": 13662 }, { "epoch": 0.41, "learning_rate": 3.3216920744437103e-06, "loss": 1.0075, "step": 13663 }, { "epoch": 0.41, "learning_rate": 3.3214617020850087e-06, "loss": 1.1555, "step": 13664 }, { "epoch": 0.41, "learning_rate": 3.3212313219063876e-06, "loss": 1.1906, "step": 13665 }, { "epoch": 0.41, "learning_rate": 3.321000933910039e-06, "loss": 1.1473, "step": 13666 }, { "epoch": 0.41, "learning_rate": 3.320770538098157e-06, "loss": 1.1308, "step": 13667 }, { "epoch": 0.41, "learning_rate": 3.320540134472935e-06, "loss": 1.1985, "step": 13668 }, { "epoch": 0.41, "learning_rate": 3.3203097230365664e-06, "loss": 1.0612, "step": 13669 }, { "epoch": 0.41, "learning_rate": 3.320079303791244e-06, "loss": 1.2013, "step": 13670 }, { "epoch": 0.41, "learning_rate": 3.3198488767391623e-06, "loss": 1.0778, "step": 13671 }, { "epoch": 0.41, "learning_rate": 3.3196184418825133e-06, "loss": 1.1794, "step": 13672 }, { "epoch": 0.41, "learning_rate": 3.3193879992234923e-06, "loss": 1.0818, "step": 13673 }, { "epoch": 0.41, "learning_rate": 3.3191575487642915e-06, "loss": 1.1843, "step": 13674 }, { "epoch": 0.41, "learning_rate": 3.3189270905071054e-06, "loss": 1.1674, "step": 13675 }, { "epoch": 0.41, "learning_rate": 3.318696624454128e-06, "loss": 1.1201, "step": 13676 }, { "epoch": 0.41, "learning_rate": 3.318466150607553e-06, "loss": 1.1459, "step": 13677 }, { "epoch": 0.41, "learning_rate": 3.3182356689695745e-06, "loss": 1.1093, "step": 13678 }, { "epoch": 0.41, "learning_rate": 3.318005179542386e-06, "loss": 1.0835, "step": 13679 }, { "epoch": 0.41, "learning_rate": 3.3177746823281826e-06, "loss": 1.3038, "step": 13680 }, { "epoch": 0.41, "learning_rate": 3.317544177329158e-06, "loss": 1.0217, "step": 13681 }, { "epoch": 0.41, "learning_rate": 3.317313664547507e-06, "loss": 1.0784, "step": 13682 }, { "epoch": 0.41, "learning_rate": 3.3170831439854224e-06, "loss": 1.1624, "step": 13683 }, { "epoch": 0.41, "learning_rate": 3.316852615645101e-06, "loss": 1.1458, "step": 13684 }, { "epoch": 0.41, "learning_rate": 3.316622079528735e-06, "loss": 1.1046, "step": 13685 }, { "epoch": 0.41, "learning_rate": 3.3163915356385214e-06, "loss": 1.2263, "step": 13686 }, { "epoch": 0.41, "learning_rate": 3.316160983976653e-06, "loss": 1.1105, "step": 13687 }, { "epoch": 0.41, "learning_rate": 3.3159304245453246e-06, "loss": 1.1241, "step": 13688 }, { "epoch": 0.41, "learning_rate": 3.3156998573467318e-06, "loss": 1.0848, "step": 13689 }, { "epoch": 0.41, "learning_rate": 3.3154692823830694e-06, "loss": 1.1055, "step": 13690 }, { "epoch": 0.41, "learning_rate": 3.315238699656532e-06, "loss": 1.1706, "step": 13691 }, { "epoch": 0.41, "learning_rate": 3.3150081091693152e-06, "loss": 1.1014, "step": 13692 }, { "epoch": 0.41, "learning_rate": 3.3147775109236136e-06, "loss": 1.2067, "step": 13693 }, { "epoch": 0.41, "learning_rate": 3.3145469049216223e-06, "loss": 1.236, "step": 13694 }, { "epoch": 0.41, "learning_rate": 3.314316291165537e-06, "loss": 1.1801, "step": 13695 }, { "epoch": 0.41, "learning_rate": 3.314085669657552e-06, "loss": 1.0527, "step": 13696 }, { "epoch": 0.41, "learning_rate": 3.313855040399865e-06, "loss": 1.0903, "step": 13697 }, { "epoch": 0.41, "learning_rate": 3.3136244033946687e-06, "loss": 1.3207, "step": 13698 }, { "epoch": 0.41, "learning_rate": 3.3133937586441604e-06, "loss": 1.1545, "step": 13699 }, { "epoch": 0.41, "learning_rate": 3.3131631061505352e-06, "loss": 1.0759, "step": 13700 }, { "epoch": 0.41, "learning_rate": 3.3129324459159886e-06, "loss": 1.1086, "step": 13701 }, { "epoch": 0.41, "learning_rate": 3.3127017779427172e-06, "loss": 1.1605, "step": 13702 }, { "epoch": 0.41, "learning_rate": 3.312471102232916e-06, "loss": 1.1088, "step": 13703 }, { "epoch": 0.41, "learning_rate": 3.3122404187887813e-06, "loss": 1.0797, "step": 13704 }, { "epoch": 0.41, "learning_rate": 3.3120097276125086e-06, "loss": 1.1015, "step": 13705 }, { "epoch": 0.41, "learning_rate": 3.311779028706295e-06, "loss": 1.1368, "step": 13706 }, { "epoch": 0.41, "learning_rate": 3.3115483220723355e-06, "loss": 1.0693, "step": 13707 }, { "epoch": 0.41, "learning_rate": 3.311317607712827e-06, "loss": 1.1619, "step": 13708 }, { "epoch": 0.41, "learning_rate": 3.3110868856299648e-06, "loss": 1.065, "step": 13709 }, { "epoch": 0.41, "learning_rate": 3.3108561558259476e-06, "loss": 1.1396, "step": 13710 }, { "epoch": 0.41, "learning_rate": 3.3106254183029695e-06, "loss": 1.1796, "step": 13711 }, { "epoch": 0.41, "learning_rate": 3.3103946730632286e-06, "loss": 1.0057, "step": 13712 }, { "epoch": 0.41, "learning_rate": 3.3101639201089196e-06, "loss": 1.0549, "step": 13713 }, { "epoch": 0.41, "learning_rate": 3.30993315944224e-06, "loss": 1.1332, "step": 13714 }, { "epoch": 0.41, "learning_rate": 3.309702391065388e-06, "loss": 1.0016, "step": 13715 }, { "epoch": 0.41, "learning_rate": 3.3094716149805588e-06, "loss": 1.1519, "step": 13716 }, { "epoch": 0.41, "learning_rate": 3.3092408311899497e-06, "loss": 1.0935, "step": 13717 }, { "epoch": 0.41, "learning_rate": 3.3090100396957576e-06, "loss": 1.2168, "step": 13718 }, { "epoch": 0.41, "learning_rate": 3.3087792405001802e-06, "loss": 1.0977, "step": 13719 }, { "epoch": 0.41, "learning_rate": 3.308548433605413e-06, "loss": 1.1832, "step": 13720 }, { "epoch": 0.41, "learning_rate": 3.308317619013654e-06, "loss": 1.0873, "step": 13721 }, { "epoch": 0.41, "learning_rate": 3.308086796727101e-06, "loss": 1.0966, "step": 13722 }, { "epoch": 0.41, "learning_rate": 3.307855966747951e-06, "loss": 1.1636, "step": 13723 }, { "epoch": 0.41, "learning_rate": 3.3076251290784004e-06, "loss": 1.1019, "step": 13724 }, { "epoch": 0.41, "learning_rate": 3.3073942837206484e-06, "loss": 1.1126, "step": 13725 }, { "epoch": 0.41, "learning_rate": 3.307163430676892e-06, "loss": 1.1389, "step": 13726 }, { "epoch": 0.41, "learning_rate": 3.3069325699493278e-06, "loss": 1.1224, "step": 13727 }, { "epoch": 0.41, "learning_rate": 3.3067017015401544e-06, "loss": 0.9437, "step": 13728 }, { "epoch": 0.41, "learning_rate": 3.3064708254515693e-06, "loss": 1.2087, "step": 13729 }, { "epoch": 0.41, "learning_rate": 3.3062399416857703e-06, "loss": 1.1324, "step": 13730 }, { "epoch": 0.41, "learning_rate": 3.3060090502449554e-06, "loss": 1.2092, "step": 13731 }, { "epoch": 0.41, "learning_rate": 3.3057781511313225e-06, "loss": 1.1822, "step": 13732 }, { "epoch": 0.41, "learning_rate": 3.30554724434707e-06, "loss": 1.0439, "step": 13733 }, { "epoch": 0.41, "learning_rate": 3.3053163298943946e-06, "loss": 1.1251, "step": 13734 }, { "epoch": 0.41, "learning_rate": 3.305085407775497e-06, "loss": 1.2143, "step": 13735 }, { "epoch": 0.41, "learning_rate": 3.3048544779925734e-06, "loss": 1.1759, "step": 13736 }, { "epoch": 0.41, "learning_rate": 3.3046235405478227e-06, "loss": 1.1177, "step": 13737 }, { "epoch": 0.41, "learning_rate": 3.3043925954434438e-06, "loss": 1.1713, "step": 13738 }, { "epoch": 0.41, "learning_rate": 3.304161642681634e-06, "loss": 1.0344, "step": 13739 }, { "epoch": 0.41, "learning_rate": 3.303930682264594e-06, "loss": 1.0723, "step": 13740 }, { "epoch": 0.41, "learning_rate": 3.3036997141945197e-06, "loss": 1.1417, "step": 13741 }, { "epoch": 0.41, "learning_rate": 3.303468738473612e-06, "loss": 1.0917, "step": 13742 }, { "epoch": 0.41, "learning_rate": 3.303237755104069e-06, "loss": 1.161, "step": 13743 }, { "epoch": 0.41, "learning_rate": 3.303006764088089e-06, "loss": 1.1276, "step": 13744 }, { "epoch": 0.41, "learning_rate": 3.3027757654278715e-06, "loss": 1.2436, "step": 13745 }, { "epoch": 0.41, "learning_rate": 3.3025447591256154e-06, "loss": 1.0299, "step": 13746 }, { "epoch": 0.41, "learning_rate": 3.3023137451835198e-06, "loss": 1.065, "step": 13747 }, { "epoch": 0.41, "learning_rate": 3.3020827236037835e-06, "loss": 1.0447, "step": 13748 }, { "epoch": 0.41, "learning_rate": 3.301851694388606e-06, "loss": 1.12, "step": 13749 }, { "epoch": 0.41, "learning_rate": 3.301620657540186e-06, "loss": 1.1693, "step": 13750 }, { "epoch": 0.41, "learning_rate": 3.3013896130607244e-06, "loss": 1.1627, "step": 13751 }, { "epoch": 0.41, "learning_rate": 3.301158560952419e-06, "loss": 0.9606, "step": 13752 }, { "epoch": 0.41, "learning_rate": 3.3009275012174704e-06, "loss": 1.007, "step": 13753 }, { "epoch": 0.41, "learning_rate": 3.300696433858077e-06, "loss": 1.1345, "step": 13754 }, { "epoch": 0.41, "learning_rate": 3.3004653588764397e-06, "loss": 1.2297, "step": 13755 }, { "epoch": 0.41, "learning_rate": 3.300234276274758e-06, "loss": 1.0969, "step": 13756 }, { "epoch": 0.41, "learning_rate": 3.3000031860552313e-06, "loss": 1.1589, "step": 13757 }, { "epoch": 0.41, "learning_rate": 3.2997720882200597e-06, "loss": 1.0482, "step": 13758 }, { "epoch": 0.41, "learning_rate": 3.299540982771442e-06, "loss": 1.1629, "step": 13759 }, { "epoch": 0.41, "learning_rate": 3.2993098697115805e-06, "loss": 1.118, "step": 13760 }, { "epoch": 0.41, "learning_rate": 3.299078749042673e-06, "loss": 1.2317, "step": 13761 }, { "epoch": 0.41, "learning_rate": 3.2988476207669206e-06, "loss": 1.2063, "step": 13762 }, { "epoch": 0.41, "learning_rate": 3.2986164848865243e-06, "loss": 1.1521, "step": 13763 }, { "epoch": 0.41, "learning_rate": 3.2983853414036838e-06, "loss": 1.2281, "step": 13764 }, { "epoch": 0.41, "learning_rate": 3.2981541903205982e-06, "loss": 1.0627, "step": 13765 }, { "epoch": 0.41, "learning_rate": 3.2979230316394705e-06, "loss": 1.2043, "step": 13766 }, { "epoch": 0.41, "learning_rate": 3.297691865362499e-06, "loss": 1.1003, "step": 13767 }, { "epoch": 0.41, "learning_rate": 3.297460691491885e-06, "loss": 1.1392, "step": 13768 }, { "epoch": 0.41, "learning_rate": 3.29722951002983e-06, "loss": 1.2401, "step": 13769 }, { "epoch": 0.41, "learning_rate": 3.2969983209785337e-06, "loss": 1.1727, "step": 13770 }, { "epoch": 0.41, "learning_rate": 3.2967671243401978e-06, "loss": 1.064, "step": 13771 }, { "epoch": 0.41, "learning_rate": 3.296535920117022e-06, "loss": 1.1916, "step": 13772 }, { "epoch": 0.41, "learning_rate": 3.2963047083112078e-06, "loss": 1.05, "step": 13773 }, { "epoch": 0.41, "learning_rate": 3.296073488924956e-06, "loss": 1.1381, "step": 13774 }, { "epoch": 0.41, "learning_rate": 3.2958422619604678e-06, "loss": 1.1453, "step": 13775 }, { "epoch": 0.42, "learning_rate": 3.295611027419946e-06, "loss": 1.2476, "step": 13776 }, { "epoch": 0.42, "learning_rate": 3.2953797853055892e-06, "loss": 1.1042, "step": 13777 }, { "epoch": 0.42, "learning_rate": 3.2951485356196e-06, "loss": 1.0844, "step": 13778 }, { "epoch": 0.42, "learning_rate": 3.2949172783641803e-06, "loss": 1.1296, "step": 13779 }, { "epoch": 0.42, "learning_rate": 3.2946860135415306e-06, "loss": 1.2281, "step": 13780 }, { "epoch": 0.42, "learning_rate": 3.2944547411538517e-06, "loss": 1.1001, "step": 13781 }, { "epoch": 0.42, "learning_rate": 3.294223461203348e-06, "loss": 1.1024, "step": 13782 }, { "epoch": 0.42, "learning_rate": 3.2939921736922186e-06, "loss": 1.1458, "step": 13783 }, { "epoch": 0.42, "learning_rate": 3.2937608786226665e-06, "loss": 1.0988, "step": 13784 }, { "epoch": 0.42, "learning_rate": 3.293529575996893e-06, "loss": 1.124, "step": 13785 }, { "epoch": 0.42, "learning_rate": 3.2932982658171003e-06, "loss": 1.2455, "step": 13786 }, { "epoch": 0.42, "learning_rate": 3.29306694808549e-06, "loss": 1.1589, "step": 13787 }, { "epoch": 0.42, "learning_rate": 3.2928356228042644e-06, "loss": 1.289, "step": 13788 }, { "epoch": 0.42, "learning_rate": 3.292604289975625e-06, "loss": 1.0418, "step": 13789 }, { "epoch": 0.42, "learning_rate": 3.2923729496017746e-06, "loss": 1.1246, "step": 13790 }, { "epoch": 0.42, "learning_rate": 3.2921416016849157e-06, "loss": 1.1846, "step": 13791 }, { "epoch": 0.42, "learning_rate": 3.29191024622725e-06, "loss": 1.2372, "step": 13792 }, { "epoch": 0.42, "learning_rate": 3.2916788832309803e-06, "loss": 1.219, "step": 13793 }, { "epoch": 0.42, "learning_rate": 3.2914475126983087e-06, "loss": 1.0831, "step": 13794 }, { "epoch": 0.42, "learning_rate": 3.2912161346314387e-06, "loss": 1.2308, "step": 13795 }, { "epoch": 0.42, "learning_rate": 3.2909847490325713e-06, "loss": 1.1187, "step": 13796 }, { "epoch": 0.42, "learning_rate": 3.2907533559039106e-06, "loss": 1.1421, "step": 13797 }, { "epoch": 0.42, "learning_rate": 3.2905219552476587e-06, "loss": 1.1304, "step": 13798 }, { "epoch": 0.42, "learning_rate": 3.2902905470660184e-06, "loss": 1.1917, "step": 13799 }, { "epoch": 0.42, "learning_rate": 3.2900591313611924e-06, "loss": 1.1331, "step": 13800 }, { "epoch": 0.42, "learning_rate": 3.2898277081353846e-06, "loss": 1.1, "step": 13801 }, { "epoch": 0.42, "learning_rate": 3.289596277390797e-06, "loss": 1.0553, "step": 13802 }, { "epoch": 0.42, "learning_rate": 3.2893648391296327e-06, "loss": 1.2032, "step": 13803 }, { "epoch": 0.42, "learning_rate": 3.289133393354096e-06, "loss": 1.1746, "step": 13804 }, { "epoch": 0.42, "learning_rate": 3.288901940066389e-06, "loss": 1.0004, "step": 13805 }, { "epoch": 0.42, "learning_rate": 3.288670479268716e-06, "loss": 1.155, "step": 13806 }, { "epoch": 0.42, "learning_rate": 3.2884390109632793e-06, "loss": 1.1624, "step": 13807 }, { "epoch": 0.42, "learning_rate": 3.2882075351522834e-06, "loss": 1.1169, "step": 13808 }, { "epoch": 0.42, "learning_rate": 3.2879760518379313e-06, "loss": 1.1384, "step": 13809 }, { "epoch": 0.42, "learning_rate": 3.287744561022427e-06, "loss": 1.0988, "step": 13810 }, { "epoch": 0.42, "learning_rate": 3.287513062707973e-06, "loss": 1.2103, "step": 13811 }, { "epoch": 0.42, "learning_rate": 3.287281556896775e-06, "loss": 1.233, "step": 13812 }, { "epoch": 0.42, "learning_rate": 3.2870500435910346e-06, "loss": 1.2034, "step": 13813 }, { "epoch": 0.42, "learning_rate": 3.2868185227929576e-06, "loss": 1.127, "step": 13814 }, { "epoch": 0.42, "learning_rate": 3.286586994504747e-06, "loss": 1.0066, "step": 13815 }, { "epoch": 0.42, "learning_rate": 3.2863554587286067e-06, "loss": 1.009, "step": 13816 }, { "epoch": 0.42, "learning_rate": 3.2861239154667416e-06, "loss": 1.0598, "step": 13817 }, { "epoch": 0.42, "learning_rate": 3.2858923647213553e-06, "loss": 1.1949, "step": 13818 }, { "epoch": 0.42, "learning_rate": 3.285660806494652e-06, "loss": 0.9948, "step": 13819 }, { "epoch": 0.42, "learning_rate": 3.285429240788836e-06, "loss": 1.1487, "step": 13820 }, { "epoch": 0.42, "learning_rate": 3.2851976676061127e-06, "loss": 1.1069, "step": 13821 }, { "epoch": 0.42, "learning_rate": 3.2849660869486853e-06, "loss": 1.1035, "step": 13822 }, { "epoch": 0.42, "learning_rate": 3.284734498818759e-06, "loss": 1.1915, "step": 13823 }, { "epoch": 0.42, "learning_rate": 3.2845029032185384e-06, "loss": 1.1411, "step": 13824 }, { "epoch": 0.42, "learning_rate": 3.284271300150228e-06, "loss": 1.0331, "step": 13825 }, { "epoch": 0.42, "learning_rate": 3.284039689616032e-06, "loss": 1.2944, "step": 13826 }, { "epoch": 0.42, "learning_rate": 3.2838080716181566e-06, "loss": 1.1814, "step": 13827 }, { "epoch": 0.42, "learning_rate": 3.283576446158805e-06, "loss": 1.226, "step": 13828 }, { "epoch": 0.42, "learning_rate": 3.2833448132401836e-06, "loss": 1.1192, "step": 13829 }, { "epoch": 0.42, "learning_rate": 3.283113172864496e-06, "loss": 1.1959, "step": 13830 }, { "epoch": 0.42, "learning_rate": 3.2828815250339484e-06, "loss": 1.2065, "step": 13831 }, { "epoch": 0.42, "learning_rate": 3.2826498697507457e-06, "loss": 1.0792, "step": 13832 }, { "epoch": 0.42, "learning_rate": 3.282418207017094e-06, "loss": 1.1633, "step": 13833 }, { "epoch": 0.42, "learning_rate": 3.282186536835197e-06, "loss": 1.1077, "step": 13834 }, { "epoch": 0.42, "learning_rate": 3.281954859207261e-06, "loss": 1.1507, "step": 13835 }, { "epoch": 0.42, "learning_rate": 3.2817231741354917e-06, "loss": 1.0428, "step": 13836 }, { "epoch": 0.42, "learning_rate": 3.2814914816220938e-06, "loss": 1.2111, "step": 13837 }, { "epoch": 0.42, "learning_rate": 3.281259781669274e-06, "loss": 1.2024, "step": 13838 }, { "epoch": 0.42, "learning_rate": 3.2810280742792367e-06, "loss": 1.1454, "step": 13839 }, { "epoch": 0.42, "learning_rate": 3.2807963594541893e-06, "loss": 1.1187, "step": 13840 }, { "epoch": 0.42, "learning_rate": 3.280564637196336e-06, "loss": 1.1686, "step": 13841 }, { "epoch": 0.42, "learning_rate": 3.280332907507883e-06, "loss": 1.0681, "step": 13842 }, { "epoch": 0.42, "learning_rate": 3.280101170391037e-06, "loss": 1.1874, "step": 13843 }, { "epoch": 0.42, "learning_rate": 3.2798694258480025e-06, "loss": 1.1526, "step": 13844 }, { "epoch": 0.42, "learning_rate": 3.2796376738809876e-06, "loss": 1.0212, "step": 13845 }, { "epoch": 0.42, "learning_rate": 3.2794059144921977e-06, "loss": 1.1208, "step": 13846 }, { "epoch": 0.42, "learning_rate": 3.279174147683838e-06, "loss": 1.0827, "step": 13847 }, { "epoch": 0.42, "learning_rate": 3.278942373458116e-06, "loss": 1.1055, "step": 13848 }, { "epoch": 0.42, "learning_rate": 3.2787105918172386e-06, "loss": 1.2328, "step": 13849 }, { "epoch": 0.42, "learning_rate": 3.2784788027634105e-06, "loss": 1.1387, "step": 13850 }, { "epoch": 0.42, "learning_rate": 3.27824700629884e-06, "loss": 1.0402, "step": 13851 }, { "epoch": 0.42, "learning_rate": 3.2780152024257316e-06, "loss": 1.1561, "step": 13852 }, { "epoch": 0.42, "learning_rate": 3.2777833911462942e-06, "loss": 1.0251, "step": 13853 }, { "epoch": 0.42, "learning_rate": 3.2775515724627327e-06, "loss": 1.1055, "step": 13854 }, { "epoch": 0.42, "learning_rate": 3.2773197463772556e-06, "loss": 1.1989, "step": 13855 }, { "epoch": 0.42, "learning_rate": 3.2770879128920685e-06, "loss": 1.1075, "step": 13856 }, { "epoch": 0.42, "learning_rate": 3.2768560720093786e-06, "loss": 1.1351, "step": 13857 }, { "epoch": 0.42, "learning_rate": 3.2766242237313926e-06, "loss": 1.0368, "step": 13858 }, { "epoch": 0.42, "learning_rate": 3.276392368060319e-06, "loss": 1.1259, "step": 13859 }, { "epoch": 0.42, "learning_rate": 3.276160504998363e-06, "loss": 1.1285, "step": 13860 }, { "epoch": 0.42, "learning_rate": 3.275928634547733e-06, "loss": 1.2323, "step": 13861 }, { "epoch": 0.42, "learning_rate": 3.275696756710637e-06, "loss": 1.0825, "step": 13862 }, { "epoch": 0.42, "learning_rate": 3.2754648714892805e-06, "loss": 1.0646, "step": 13863 }, { "epoch": 0.42, "learning_rate": 3.2752329788858728e-06, "loss": 1.1639, "step": 13864 }, { "epoch": 0.42, "learning_rate": 3.2750010789026194e-06, "loss": 1.0489, "step": 13865 }, { "epoch": 0.42, "learning_rate": 3.27476917154173e-06, "loss": 1.1508, "step": 13866 }, { "epoch": 0.42, "learning_rate": 3.274537256805411e-06, "loss": 1.1083, "step": 13867 }, { "epoch": 0.42, "learning_rate": 3.2743053346958696e-06, "loss": 1.1479, "step": 13868 }, { "epoch": 0.42, "learning_rate": 3.274073405215315e-06, "loss": 1.1049, "step": 13869 }, { "epoch": 0.42, "learning_rate": 3.2738414683659546e-06, "loss": 1.1503, "step": 13870 }, { "epoch": 0.42, "learning_rate": 3.2736095241499953e-06, "loss": 1.1375, "step": 13871 }, { "epoch": 0.42, "learning_rate": 3.2733775725696464e-06, "loss": 1.0598, "step": 13872 }, { "epoch": 0.42, "learning_rate": 3.2731456136271155e-06, "loss": 1.0958, "step": 13873 }, { "epoch": 0.42, "learning_rate": 3.2729136473246102e-06, "loss": 1.1516, "step": 13874 }, { "epoch": 0.42, "learning_rate": 3.27268167366434e-06, "loss": 1.2678, "step": 13875 }, { "epoch": 0.42, "learning_rate": 3.2724496926485118e-06, "loss": 1.1888, "step": 13876 }, { "epoch": 0.42, "learning_rate": 3.272217704279335e-06, "loss": 1.134, "step": 13877 }, { "epoch": 0.42, "learning_rate": 3.271985708559017e-06, "loss": 1.0716, "step": 13878 }, { "epoch": 0.42, "learning_rate": 3.271753705489768e-06, "loss": 1.1605, "step": 13879 }, { "epoch": 0.42, "learning_rate": 3.2715216950737947e-06, "loss": 1.0585, "step": 13880 }, { "epoch": 0.42, "learning_rate": 3.271289677313307e-06, "loss": 1.1019, "step": 13881 }, { "epoch": 0.42, "learning_rate": 3.271057652210512e-06, "loss": 1.2464, "step": 13882 }, { "epoch": 0.42, "learning_rate": 3.27082561976762e-06, "loss": 1.0909, "step": 13883 }, { "epoch": 0.42, "learning_rate": 3.2705935799868393e-06, "loss": 1.1013, "step": 13884 }, { "epoch": 0.42, "learning_rate": 3.2703615328703787e-06, "loss": 1.1637, "step": 13885 }, { "epoch": 0.42, "learning_rate": 3.2701294784204475e-06, "loss": 1.1079, "step": 13886 }, { "epoch": 0.42, "learning_rate": 3.269897416639254e-06, "loss": 1.2158, "step": 13887 }, { "epoch": 0.42, "learning_rate": 3.2696653475290085e-06, "loss": 1.171, "step": 13888 }, { "epoch": 0.42, "learning_rate": 3.2694332710919197e-06, "loss": 1.0838, "step": 13889 }, { "epoch": 0.42, "learning_rate": 3.2692011873301965e-06, "loss": 1.2168, "step": 13890 }, { "epoch": 0.42, "learning_rate": 3.2689690962460483e-06, "loss": 1.1741, "step": 13891 }, { "epoch": 0.42, "learning_rate": 3.2687369978416856e-06, "loss": 1.2181, "step": 13892 }, { "epoch": 0.42, "learning_rate": 3.2685048921193157e-06, "loss": 1.1622, "step": 13893 }, { "epoch": 0.42, "learning_rate": 3.26827277908115e-06, "loss": 1.1461, "step": 13894 }, { "epoch": 0.42, "learning_rate": 3.268040658729397e-06, "loss": 1.1615, "step": 13895 }, { "epoch": 0.42, "learning_rate": 3.2678085310662676e-06, "loss": 1.0565, "step": 13896 }, { "epoch": 0.42, "learning_rate": 3.2675763960939705e-06, "loss": 1.1094, "step": 13897 }, { "epoch": 0.42, "learning_rate": 3.2673442538147148e-06, "loss": 1.1349, "step": 13898 }, { "epoch": 0.42, "learning_rate": 3.2671121042307126e-06, "loss": 1.1786, "step": 13899 }, { "epoch": 0.42, "learning_rate": 3.266879947344172e-06, "loss": 1.1794, "step": 13900 }, { "epoch": 0.42, "learning_rate": 3.266647783157304e-06, "loss": 1.0725, "step": 13901 }, { "epoch": 0.42, "learning_rate": 3.2664156116723177e-06, "loss": 1.0756, "step": 13902 }, { "epoch": 0.42, "learning_rate": 3.266183432891425e-06, "loss": 1.1404, "step": 13903 }, { "epoch": 0.42, "learning_rate": 3.2659512468168342e-06, "loss": 1.1177, "step": 13904 }, { "epoch": 0.42, "learning_rate": 3.2657190534507565e-06, "loss": 1.1741, "step": 13905 }, { "epoch": 0.42, "learning_rate": 3.265486852795402e-06, "loss": 1.2086, "step": 13906 }, { "epoch": 0.42, "learning_rate": 3.265254644852982e-06, "loss": 1.1106, "step": 13907 }, { "epoch": 0.42, "learning_rate": 3.2650224296257062e-06, "loss": 1.1655, "step": 13908 }, { "epoch": 0.42, "learning_rate": 3.264790207115785e-06, "loss": 1.122, "step": 13909 }, { "epoch": 0.42, "learning_rate": 3.264557977325429e-06, "loss": 1.1252, "step": 13910 }, { "epoch": 0.42, "learning_rate": 3.2643257402568505e-06, "loss": 1.1287, "step": 13911 }, { "epoch": 0.42, "learning_rate": 3.264093495912258e-06, "loss": 1.2737, "step": 13912 }, { "epoch": 0.42, "learning_rate": 3.2638612442938635e-06, "loss": 1.0862, "step": 13913 }, { "epoch": 0.42, "learning_rate": 3.2636289854038776e-06, "loss": 1.131, "step": 13914 }, { "epoch": 0.42, "learning_rate": 3.263396719244512e-06, "loss": 1.0198, "step": 13915 }, { "epoch": 0.42, "learning_rate": 3.263164445817978e-06, "loss": 1.0727, "step": 13916 }, { "epoch": 0.42, "learning_rate": 3.2629321651264843e-06, "loss": 1.1983, "step": 13917 }, { "epoch": 0.42, "learning_rate": 3.262699877172246e-06, "loss": 1.1134, "step": 13918 }, { "epoch": 0.42, "learning_rate": 3.26246758195747e-06, "loss": 1.1853, "step": 13919 }, { "epoch": 0.42, "learning_rate": 3.2622352794843716e-06, "loss": 1.1222, "step": 13920 }, { "epoch": 0.42, "learning_rate": 3.262002969755159e-06, "loss": 1.1766, "step": 13921 }, { "epoch": 0.42, "learning_rate": 3.2617706527720465e-06, "loss": 1.1608, "step": 13922 }, { "epoch": 0.42, "learning_rate": 3.261538328537244e-06, "loss": 1.1373, "step": 13923 }, { "epoch": 0.42, "learning_rate": 3.2613059970529625e-06, "loss": 1.0535, "step": 13924 }, { "epoch": 0.42, "learning_rate": 3.2610736583214155e-06, "loss": 1.0031, "step": 13925 }, { "epoch": 0.42, "learning_rate": 3.260841312344813e-06, "loss": 1.1212, "step": 13926 }, { "epoch": 0.42, "learning_rate": 3.2606089591253674e-06, "loss": 1.0627, "step": 13927 }, { "epoch": 0.42, "learning_rate": 3.260376598665291e-06, "loss": 1.1092, "step": 13928 }, { "epoch": 0.42, "learning_rate": 3.2601442309667967e-06, "loss": 1.2169, "step": 13929 }, { "epoch": 0.42, "learning_rate": 3.2599118560320946e-06, "loss": 1.1694, "step": 13930 }, { "epoch": 0.42, "learning_rate": 3.259679473863398e-06, "loss": 1.1624, "step": 13931 }, { "epoch": 0.42, "learning_rate": 3.2594470844629185e-06, "loss": 1.1234, "step": 13932 }, { "epoch": 0.42, "learning_rate": 3.2592146878328685e-06, "loss": 1.0806, "step": 13933 }, { "epoch": 0.42, "learning_rate": 3.2589822839754603e-06, "loss": 1.1169, "step": 13934 }, { "epoch": 0.42, "learning_rate": 3.258749872892907e-06, "loss": 1.0699, "step": 13935 }, { "epoch": 0.42, "learning_rate": 3.258517454587419e-06, "loss": 1.1573, "step": 13936 }, { "epoch": 0.42, "learning_rate": 3.2582850290612113e-06, "loss": 1.2712, "step": 13937 }, { "epoch": 0.42, "learning_rate": 3.2580525963164945e-06, "loss": 1.2386, "step": 13938 }, { "epoch": 0.42, "learning_rate": 3.2578201563554818e-06, "loss": 1.0767, "step": 13939 }, { "epoch": 0.42, "learning_rate": 3.2575877091803864e-06, "loss": 1.1285, "step": 13940 }, { "epoch": 0.42, "learning_rate": 3.2573552547934217e-06, "loss": 1.0687, "step": 13941 }, { "epoch": 0.42, "learning_rate": 3.2571227931967993e-06, "loss": 1.0438, "step": 13942 }, { "epoch": 0.42, "learning_rate": 3.256890324392732e-06, "loss": 1.2101, "step": 13943 }, { "epoch": 0.42, "learning_rate": 3.2566578483834345e-06, "loss": 1.157, "step": 13944 }, { "epoch": 0.42, "learning_rate": 3.2564253651711175e-06, "loss": 1.1058, "step": 13945 }, { "epoch": 0.42, "learning_rate": 3.2561928747579963e-06, "loss": 1.0874, "step": 13946 }, { "epoch": 0.42, "learning_rate": 3.2559603771462826e-06, "loss": 1.0768, "step": 13947 }, { "epoch": 0.42, "learning_rate": 3.255727872338191e-06, "loss": 1.0806, "step": 13948 }, { "epoch": 0.42, "learning_rate": 3.255495360335933e-06, "loss": 1.1392, "step": 13949 }, { "epoch": 0.42, "learning_rate": 3.2552628411417236e-06, "loss": 1.158, "step": 13950 }, { "epoch": 0.42, "learning_rate": 3.255030314757775e-06, "loss": 1.2177, "step": 13951 }, { "epoch": 0.42, "learning_rate": 3.2547977811863024e-06, "loss": 1.2103, "step": 13952 }, { "epoch": 0.42, "learning_rate": 3.254565240429518e-06, "loss": 1.182, "step": 13953 }, { "epoch": 0.42, "learning_rate": 3.2543326924896358e-06, "loss": 1.1174, "step": 13954 }, { "epoch": 0.42, "learning_rate": 3.254100137368869e-06, "loss": 1.2137, "step": 13955 }, { "epoch": 0.42, "learning_rate": 3.2538675750694327e-06, "loss": 1.2219, "step": 13956 }, { "epoch": 0.42, "learning_rate": 3.2536350055935404e-06, "loss": 1.1642, "step": 13957 }, { "epoch": 0.42, "learning_rate": 3.2534024289434058e-06, "loss": 1.1046, "step": 13958 }, { "epoch": 0.42, "learning_rate": 3.253169845121243e-06, "loss": 1.2551, "step": 13959 }, { "epoch": 0.42, "learning_rate": 3.2529372541292658e-06, "loss": 1.0981, "step": 13960 }, { "epoch": 0.42, "learning_rate": 3.2527046559696882e-06, "loss": 1.1583, "step": 13961 }, { "epoch": 0.42, "learning_rate": 3.2524720506447253e-06, "loss": 1.1055, "step": 13962 }, { "epoch": 0.42, "learning_rate": 3.2522394381565915e-06, "loss": 1.0175, "step": 13963 }, { "epoch": 0.42, "learning_rate": 3.2520068185074993e-06, "loss": 1.1382, "step": 13964 }, { "epoch": 0.42, "learning_rate": 3.2517741916996653e-06, "loss": 1.1293, "step": 13965 }, { "epoch": 0.42, "learning_rate": 3.2515415577353025e-06, "loss": 1.1483, "step": 13966 }, { "epoch": 0.42, "learning_rate": 3.2513089166166254e-06, "loss": 1.1649, "step": 13967 }, { "epoch": 0.42, "learning_rate": 3.2510762683458503e-06, "loss": 1.2555, "step": 13968 }, { "epoch": 0.42, "learning_rate": 3.25084361292519e-06, "loss": 1.1627, "step": 13969 }, { "epoch": 0.42, "learning_rate": 3.2506109503568617e-06, "loss": 1.0829, "step": 13970 }, { "epoch": 0.42, "learning_rate": 3.2503782806430774e-06, "loss": 1.0898, "step": 13971 }, { "epoch": 0.42, "learning_rate": 3.2501456037860533e-06, "loss": 1.2435, "step": 13972 }, { "epoch": 0.42, "learning_rate": 3.249912919788005e-06, "loss": 1.2594, "step": 13973 }, { "epoch": 0.42, "learning_rate": 3.2496802286511463e-06, "loss": 1.3842, "step": 13974 }, { "epoch": 0.42, "learning_rate": 3.249447530377693e-06, "loss": 1.0852, "step": 13975 }, { "epoch": 0.42, "learning_rate": 3.24921482496986e-06, "loss": 1.1573, "step": 13976 }, { "epoch": 0.42, "learning_rate": 3.2489821124298633e-06, "loss": 1.1047, "step": 13977 }, { "epoch": 0.42, "learning_rate": 3.2487493927599172e-06, "loss": 1.1625, "step": 13978 }, { "epoch": 0.42, "learning_rate": 3.2485166659622376e-06, "loss": 1.1904, "step": 13979 }, { "epoch": 0.42, "learning_rate": 3.248283932039039e-06, "loss": 1.1514, "step": 13980 }, { "epoch": 0.42, "learning_rate": 3.2480511909925384e-06, "loss": 1.1192, "step": 13981 }, { "epoch": 0.42, "learning_rate": 3.247818442824951e-06, "loss": 1.1276, "step": 13982 }, { "epoch": 0.42, "learning_rate": 3.247585687538492e-06, "loss": 1.2328, "step": 13983 }, { "epoch": 0.42, "learning_rate": 3.247352925135377e-06, "loss": 1.1169, "step": 13984 }, { "epoch": 0.42, "learning_rate": 3.2471201556178226e-06, "loss": 1.0502, "step": 13985 }, { "epoch": 0.42, "learning_rate": 3.246887378988044e-06, "loss": 1.1268, "step": 13986 }, { "epoch": 0.42, "learning_rate": 3.2466545952482576e-06, "loss": 1.2552, "step": 13987 }, { "epoch": 0.42, "learning_rate": 3.2464218044006778e-06, "loss": 1.0886, "step": 13988 }, { "epoch": 0.42, "learning_rate": 3.246189006447523e-06, "loss": 1.1395, "step": 13989 }, { "epoch": 0.42, "learning_rate": 3.2459562013910084e-06, "loss": 1.0376, "step": 13990 }, { "epoch": 0.42, "learning_rate": 3.2457233892333497e-06, "loss": 1.1329, "step": 13991 }, { "epoch": 0.42, "learning_rate": 3.245490569976763e-06, "loss": 1.086, "step": 13992 }, { "epoch": 0.42, "learning_rate": 3.2452577436234656e-06, "loss": 1.1937, "step": 13993 }, { "epoch": 0.42, "learning_rate": 3.2450249101756736e-06, "loss": 1.108, "step": 13994 }, { "epoch": 0.42, "learning_rate": 3.2447920696356027e-06, "loss": 1.1625, "step": 13995 }, { "epoch": 0.42, "learning_rate": 3.24455922200547e-06, "loss": 1.1168, "step": 13996 }, { "epoch": 0.42, "learning_rate": 3.2443263672874923e-06, "loss": 1.0825, "step": 13997 }, { "epoch": 0.42, "learning_rate": 3.2440935054838862e-06, "loss": 1.0559, "step": 13998 }, { "epoch": 0.42, "learning_rate": 3.2438606365968685e-06, "loss": 0.9066, "step": 13999 }, { "epoch": 0.42, "learning_rate": 3.243627760628656e-06, "loss": 1.1467, "step": 14000 }, { "epoch": 0.42, "learning_rate": 3.2433948775814645e-06, "loss": 1.2185, "step": 14001 }, { "epoch": 0.42, "learning_rate": 3.2431619874575126e-06, "loss": 1.0005, "step": 14002 }, { "epoch": 0.42, "learning_rate": 3.242929090259016e-06, "loss": 1.1573, "step": 14003 }, { "epoch": 0.42, "learning_rate": 3.242696185988192e-06, "loss": 1.027, "step": 14004 }, { "epoch": 0.42, "learning_rate": 3.2424632746472584e-06, "loss": 1.2009, "step": 14005 }, { "epoch": 0.42, "learning_rate": 3.2422303562384322e-06, "loss": 1.1554, "step": 14006 }, { "epoch": 0.42, "learning_rate": 3.24199743076393e-06, "loss": 1.1354, "step": 14007 }, { "epoch": 0.42, "learning_rate": 3.24176449822597e-06, "loss": 1.1581, "step": 14008 }, { "epoch": 0.42, "learning_rate": 3.2415315586267694e-06, "loss": 1.0803, "step": 14009 }, { "epoch": 0.42, "learning_rate": 3.241298611968545e-06, "loss": 1.1735, "step": 14010 }, { "epoch": 0.42, "learning_rate": 3.2410656582535148e-06, "loss": 1.2056, "step": 14011 }, { "epoch": 0.42, "learning_rate": 3.2408326974838967e-06, "loss": 1.2797, "step": 14012 }, { "epoch": 0.42, "learning_rate": 3.2405997296619085e-06, "loss": 1.1392, "step": 14013 }, { "epoch": 0.42, "learning_rate": 3.2403667547897666e-06, "loss": 1.0595, "step": 14014 }, { "epoch": 0.42, "learning_rate": 3.240133772869691e-06, "loss": 1.0581, "step": 14015 }, { "epoch": 0.42, "learning_rate": 3.2399007839038977e-06, "loss": 1.1697, "step": 14016 }, { "epoch": 0.42, "learning_rate": 3.2396677878946055e-06, "loss": 1.2198, "step": 14017 }, { "epoch": 0.42, "learning_rate": 3.2394347848440317e-06, "loss": 1.1759, "step": 14018 }, { "epoch": 0.42, "learning_rate": 3.239201774754395e-06, "loss": 1.1329, "step": 14019 }, { "epoch": 0.42, "learning_rate": 3.2389687576279135e-06, "loss": 1.1576, "step": 14020 }, { "epoch": 0.42, "learning_rate": 3.2387357334668053e-06, "loss": 1.1906, "step": 14021 }, { "epoch": 0.42, "learning_rate": 3.2385027022732882e-06, "loss": 1.2283, "step": 14022 }, { "epoch": 0.42, "learning_rate": 3.238269664049582e-06, "loss": 1.0904, "step": 14023 }, { "epoch": 0.42, "learning_rate": 3.238036618797904e-06, "loss": 1.1935, "step": 14024 }, { "epoch": 0.42, "learning_rate": 3.2378035665204723e-06, "loss": 1.0507, "step": 14025 }, { "epoch": 0.42, "learning_rate": 3.2375705072195065e-06, "loss": 1.1317, "step": 14026 }, { "epoch": 0.42, "learning_rate": 3.237337440897224e-06, "loss": 1.1392, "step": 14027 }, { "epoch": 0.42, "learning_rate": 3.2371043675558456e-06, "loss": 1.2231, "step": 14028 }, { "epoch": 0.42, "learning_rate": 3.236871287197587e-06, "loss": 1.1907, "step": 14029 }, { "epoch": 0.42, "learning_rate": 3.23663819982467e-06, "loss": 1.208, "step": 14030 }, { "epoch": 0.42, "learning_rate": 3.236405105439311e-06, "loss": 1.0516, "step": 14031 }, { "epoch": 0.42, "learning_rate": 3.2361720040437307e-06, "loss": 1.1077, "step": 14032 }, { "epoch": 0.42, "learning_rate": 3.2359388956401472e-06, "loss": 1.1606, "step": 14033 }, { "epoch": 0.42, "learning_rate": 3.23570578023078e-06, "loss": 1.0013, "step": 14034 }, { "epoch": 0.42, "learning_rate": 3.235472657817848e-06, "loss": 1.074, "step": 14035 }, { "epoch": 0.42, "learning_rate": 3.2352395284035703e-06, "loss": 1.2125, "step": 14036 }, { "epoch": 0.42, "learning_rate": 3.235006391990166e-06, "loss": 1.0896, "step": 14037 }, { "epoch": 0.42, "learning_rate": 3.234773248579856e-06, "loss": 1.1959, "step": 14038 }, { "epoch": 0.42, "learning_rate": 3.234540098174858e-06, "loss": 1.0712, "step": 14039 }, { "epoch": 0.42, "learning_rate": 3.234306940777392e-06, "loss": 1.1118, "step": 14040 }, { "epoch": 0.42, "learning_rate": 3.2340737763896778e-06, "loss": 1.0717, "step": 14041 }, { "epoch": 0.42, "learning_rate": 3.2338406050139346e-06, "loss": 1.2367, "step": 14042 }, { "epoch": 0.42, "learning_rate": 3.2336074266523825e-06, "loss": 1.1395, "step": 14043 }, { "epoch": 0.42, "learning_rate": 3.233374241307241e-06, "loss": 1.1004, "step": 14044 }, { "epoch": 0.42, "learning_rate": 3.23314104898073e-06, "loss": 1.075, "step": 14045 }, { "epoch": 0.42, "learning_rate": 3.2329078496750687e-06, "loss": 1.0479, "step": 14046 }, { "epoch": 0.42, "learning_rate": 3.232674643392478e-06, "loss": 1.0928, "step": 14047 }, { "epoch": 0.42, "learning_rate": 3.232441430135178e-06, "loss": 1.0748, "step": 14048 }, { "epoch": 0.42, "learning_rate": 3.2322082099053873e-06, "loss": 1.035, "step": 14049 }, { "epoch": 0.42, "learning_rate": 3.2319749827053275e-06, "loss": 1.2402, "step": 14050 }, { "epoch": 0.42, "learning_rate": 3.231741748537219e-06, "loss": 1.1993, "step": 14051 }, { "epoch": 0.42, "learning_rate": 3.231508507403281e-06, "loss": 1.1056, "step": 14052 }, { "epoch": 0.42, "learning_rate": 3.231275259305734e-06, "loss": 0.9988, "step": 14053 }, { "epoch": 0.42, "learning_rate": 3.2310420042467995e-06, "loss": 1.0735, "step": 14054 }, { "epoch": 0.42, "learning_rate": 3.2308087422286966e-06, "loss": 1.1591, "step": 14055 }, { "epoch": 0.42, "learning_rate": 3.230575473253647e-06, "loss": 1.0576, "step": 14056 }, { "epoch": 0.42, "learning_rate": 3.23034219732387e-06, "loss": 1.0836, "step": 14057 }, { "epoch": 0.42, "learning_rate": 3.230108914441588e-06, "loss": 1.1917, "step": 14058 }, { "epoch": 0.42, "learning_rate": 3.2298756246090204e-06, "loss": 1.0344, "step": 14059 }, { "epoch": 0.42, "learning_rate": 3.229642327828387e-06, "loss": 1.2397, "step": 14060 }, { "epoch": 0.42, "learning_rate": 3.229409024101912e-06, "loss": 1.1139, "step": 14061 }, { "epoch": 0.42, "learning_rate": 3.2291757134318134e-06, "loss": 1.3579, "step": 14062 }, { "epoch": 0.42, "learning_rate": 3.228942395820313e-06, "loss": 1.062, "step": 14063 }, { "epoch": 0.42, "learning_rate": 3.2287090712696335e-06, "loss": 1.1537, "step": 14064 }, { "epoch": 0.42, "learning_rate": 3.2284757397819934e-06, "loss": 1.0523, "step": 14065 }, { "epoch": 0.42, "learning_rate": 3.228242401359615e-06, "loss": 1.0563, "step": 14066 }, { "epoch": 0.42, "learning_rate": 3.22800905600472e-06, "loss": 1.2422, "step": 14067 }, { "epoch": 0.42, "learning_rate": 3.227775703719529e-06, "loss": 1.067, "step": 14068 }, { "epoch": 0.42, "learning_rate": 3.2275423445062647e-06, "loss": 1.2274, "step": 14069 }, { "epoch": 0.42, "learning_rate": 3.227308978367147e-06, "loss": 1.1667, "step": 14070 }, { "epoch": 0.42, "learning_rate": 3.227075605304398e-06, "loss": 1.153, "step": 14071 }, { "epoch": 0.42, "learning_rate": 3.22684222532024e-06, "loss": 1.1552, "step": 14072 }, { "epoch": 0.42, "learning_rate": 3.226608838416893e-06, "loss": 1.3093, "step": 14073 }, { "epoch": 0.42, "learning_rate": 3.226375444596581e-06, "loss": 1.2393, "step": 14074 }, { "epoch": 0.42, "learning_rate": 3.2261420438615245e-06, "loss": 1.1036, "step": 14075 }, { "epoch": 0.42, "learning_rate": 3.2259086362139447e-06, "loss": 1.1353, "step": 14076 }, { "epoch": 0.42, "learning_rate": 3.225675221656065e-06, "loss": 1.1122, "step": 14077 }, { "epoch": 0.42, "learning_rate": 3.2254418001901056e-06, "loss": 1.1007, "step": 14078 }, { "epoch": 0.42, "learning_rate": 3.22520837181829e-06, "loss": 1.1531, "step": 14079 }, { "epoch": 0.42, "learning_rate": 3.224974936542841e-06, "loss": 1.1776, "step": 14080 }, { "epoch": 0.42, "learning_rate": 3.2247414943659794e-06, "loss": 1.1692, "step": 14081 }, { "epoch": 0.42, "learning_rate": 3.2245080452899276e-06, "loss": 1.1262, "step": 14082 }, { "epoch": 0.42, "learning_rate": 3.224274589316908e-06, "loss": 1.1241, "step": 14083 }, { "epoch": 0.42, "learning_rate": 3.2240411264491433e-06, "loss": 1.2077, "step": 14084 }, { "epoch": 0.42, "learning_rate": 3.2238076566888552e-06, "loss": 1.1398, "step": 14085 }, { "epoch": 0.42, "learning_rate": 3.223574180038268e-06, "loss": 1.0545, "step": 14086 }, { "epoch": 0.42, "learning_rate": 3.223340696499603e-06, "loss": 1.175, "step": 14087 }, { "epoch": 0.42, "learning_rate": 3.2231072060750816e-06, "loss": 1.1699, "step": 14088 }, { "epoch": 0.42, "learning_rate": 3.2228737087669295e-06, "loss": 1.154, "step": 14089 }, { "epoch": 0.42, "learning_rate": 3.2226402045773665e-06, "loss": 1.1021, "step": 14090 }, { "epoch": 0.42, "learning_rate": 3.222406693508617e-06, "loss": 1.2538, "step": 14091 }, { "epoch": 0.42, "learning_rate": 3.222173175562904e-06, "loss": 1.0997, "step": 14092 }, { "epoch": 0.42, "learning_rate": 3.22193965074245e-06, "loss": 1.1769, "step": 14093 }, { "epoch": 0.42, "learning_rate": 3.221706119049478e-06, "loss": 1.1184, "step": 14094 }, { "epoch": 0.42, "learning_rate": 3.221472580486212e-06, "loss": 1.0641, "step": 14095 }, { "epoch": 0.42, "learning_rate": 3.2212390350548746e-06, "loss": 0.9837, "step": 14096 }, { "epoch": 0.42, "learning_rate": 3.2210054827576887e-06, "loss": 1.1411, "step": 14097 }, { "epoch": 0.42, "learning_rate": 3.220771923596877e-06, "loss": 1.1364, "step": 14098 }, { "epoch": 0.42, "learning_rate": 3.2205383575746645e-06, "loss": 1.115, "step": 14099 }, { "epoch": 0.42, "learning_rate": 3.2203047846932743e-06, "loss": 1.1016, "step": 14100 }, { "epoch": 0.42, "learning_rate": 3.220071204954929e-06, "loss": 1.0609, "step": 14101 }, { "epoch": 0.42, "learning_rate": 3.2198376183618524e-06, "loss": 1.0888, "step": 14102 }, { "epoch": 0.42, "learning_rate": 3.2196040249162684e-06, "loss": 1.1331, "step": 14103 }, { "epoch": 0.42, "learning_rate": 3.2193704246204003e-06, "loss": 1.0806, "step": 14104 }, { "epoch": 0.42, "learning_rate": 3.2191368174764737e-06, "loss": 1.1544, "step": 14105 }, { "epoch": 0.42, "learning_rate": 3.2189032034867094e-06, "loss": 1.2178, "step": 14106 }, { "epoch": 0.42, "learning_rate": 3.2186695826533332e-06, "loss": 1.1713, "step": 14107 }, { "epoch": 0.43, "learning_rate": 3.2184359549785693e-06, "loss": 1.1732, "step": 14108 }, { "epoch": 0.43, "learning_rate": 3.2182023204646407e-06, "loss": 1.0192, "step": 14109 }, { "epoch": 0.43, "learning_rate": 3.217968679113772e-06, "loss": 1.2174, "step": 14110 }, { "epoch": 0.43, "learning_rate": 3.2177350309281867e-06, "loss": 1.1639, "step": 14111 }, { "epoch": 0.43, "learning_rate": 3.2175013759101103e-06, "loss": 1.0807, "step": 14112 }, { "epoch": 0.43, "learning_rate": 3.2172677140617666e-06, "loss": 1.0448, "step": 14113 }, { "epoch": 0.43, "learning_rate": 3.217034045385379e-06, "loss": 1.1855, "step": 14114 }, { "epoch": 0.43, "learning_rate": 3.216800369883173e-06, "loss": 1.2028, "step": 14115 }, { "epoch": 0.43, "learning_rate": 3.216566687557372e-06, "loss": 1.1774, "step": 14116 }, { "epoch": 0.43, "learning_rate": 3.216332998410202e-06, "loss": 1.1822, "step": 14117 }, { "epoch": 0.43, "learning_rate": 3.216099302443887e-06, "loss": 1.1145, "step": 14118 }, { "epoch": 0.43, "learning_rate": 3.215865599660651e-06, "loss": 1.0624, "step": 14119 }, { "epoch": 0.43, "learning_rate": 3.2156318900627194e-06, "loss": 1.1592, "step": 14120 }, { "epoch": 0.43, "learning_rate": 3.2153981736523164e-06, "loss": 1.1619, "step": 14121 }, { "epoch": 0.43, "learning_rate": 3.215164450431668e-06, "loss": 1.0859, "step": 14122 }, { "epoch": 0.43, "learning_rate": 3.2149307204029988e-06, "loss": 1.0911, "step": 14123 }, { "epoch": 0.43, "learning_rate": 3.214696983568533e-06, "loss": 1.1553, "step": 14124 }, { "epoch": 0.43, "learning_rate": 3.214463239930496e-06, "loss": 1.2103, "step": 14125 }, { "epoch": 0.43, "learning_rate": 3.214229489491113e-06, "loss": 1.2347, "step": 14126 }, { "epoch": 0.43, "learning_rate": 3.2139957322526096e-06, "loss": 1.0574, "step": 14127 }, { "epoch": 0.43, "learning_rate": 3.2137619682172107e-06, "loss": 1.1689, "step": 14128 }, { "epoch": 0.43, "learning_rate": 3.2135281973871414e-06, "loss": 1.1288, "step": 14129 }, { "epoch": 0.43, "learning_rate": 3.2132944197646272e-06, "loss": 1.1266, "step": 14130 }, { "epoch": 0.43, "learning_rate": 3.2130606353518933e-06, "loss": 1.0892, "step": 14131 }, { "epoch": 0.43, "learning_rate": 3.212826844151166e-06, "loss": 1.1177, "step": 14132 }, { "epoch": 0.43, "learning_rate": 3.2125930461646703e-06, "loss": 1.1094, "step": 14133 }, { "epoch": 0.43, "learning_rate": 3.2123592413946324e-06, "loss": 1.1127, "step": 14134 }, { "epoch": 0.43, "learning_rate": 3.2121254298432776e-06, "loss": 1.062, "step": 14135 }, { "epoch": 0.43, "learning_rate": 3.2118916115128317e-06, "loss": 1.2609, "step": 14136 }, { "epoch": 0.43, "learning_rate": 3.2116577864055196e-06, "loss": 1.1127, "step": 14137 }, { "epoch": 0.43, "learning_rate": 3.21142395452357e-06, "loss": 1.2341, "step": 14138 }, { "epoch": 0.43, "learning_rate": 3.2111901158692054e-06, "loss": 1.141, "step": 14139 }, { "epoch": 0.43, "learning_rate": 3.2109562704446536e-06, "loss": 1.0448, "step": 14140 }, { "epoch": 0.43, "learning_rate": 3.210722418252141e-06, "loss": 1.1153, "step": 14141 }, { "epoch": 0.43, "learning_rate": 3.2104885592938926e-06, "loss": 1.1525, "step": 14142 }, { "epoch": 0.43, "learning_rate": 3.2102546935721363e-06, "loss": 1.156, "step": 14143 }, { "epoch": 0.43, "learning_rate": 3.2100208210890967e-06, "loss": 1.1439, "step": 14144 }, { "epoch": 0.43, "learning_rate": 3.209786941847001e-06, "loss": 1.1379, "step": 14145 }, { "epoch": 0.43, "learning_rate": 3.2095530558480746e-06, "loss": 1.0839, "step": 14146 }, { "epoch": 0.43, "learning_rate": 3.2093191630945463e-06, "loss": 1.0849, "step": 14147 }, { "epoch": 0.43, "learning_rate": 3.2090852635886404e-06, "loss": 1.153, "step": 14148 }, { "epoch": 0.43, "learning_rate": 3.208851357332585e-06, "loss": 1.2313, "step": 14149 }, { "epoch": 0.43, "learning_rate": 3.208617444328605e-06, "loss": 1.1984, "step": 14150 }, { "epoch": 0.43, "learning_rate": 3.2083835245789292e-06, "loss": 1.1978, "step": 14151 }, { "epoch": 0.43, "learning_rate": 3.2081495980857824e-06, "loss": 1.0131, "step": 14152 }, { "epoch": 0.43, "learning_rate": 3.2079156648513934e-06, "loss": 1.0875, "step": 14153 }, { "epoch": 0.43, "learning_rate": 3.2076817248779878e-06, "loss": 1.0875, "step": 14154 }, { "epoch": 0.43, "learning_rate": 3.2074477781677924e-06, "loss": 1.1246, "step": 14155 }, { "epoch": 0.43, "learning_rate": 3.207213824723036e-06, "loss": 1.0508, "step": 14156 }, { "epoch": 0.43, "learning_rate": 3.206979864545944e-06, "loss": 1.0758, "step": 14157 }, { "epoch": 0.43, "learning_rate": 3.2067458976387442e-06, "loss": 1.2281, "step": 14158 }, { "epoch": 0.43, "learning_rate": 3.206511924003664e-06, "loss": 1.095, "step": 14159 }, { "epoch": 0.43, "learning_rate": 3.2062779436429304e-06, "loss": 1.1505, "step": 14160 }, { "epoch": 0.43, "learning_rate": 3.2060439565587708e-06, "loss": 1.2157, "step": 14161 }, { "epoch": 0.43, "learning_rate": 3.2058099627534136e-06, "loss": 1.233, "step": 14162 }, { "epoch": 0.43, "learning_rate": 3.2055759622290844e-06, "loss": 1.2139, "step": 14163 }, { "epoch": 0.43, "learning_rate": 3.2053419549880127e-06, "loss": 1.1658, "step": 14164 }, { "epoch": 0.43, "learning_rate": 3.2051079410324248e-06, "loss": 1.0625, "step": 14165 }, { "epoch": 0.43, "learning_rate": 3.2048739203645484e-06, "loss": 1.0929, "step": 14166 }, { "epoch": 0.43, "learning_rate": 3.204639892986613e-06, "loss": 1.1766, "step": 14167 }, { "epoch": 0.43, "learning_rate": 3.204405858900844e-06, "loss": 1.1773, "step": 14168 }, { "epoch": 0.43, "learning_rate": 3.2041718181094716e-06, "loss": 1.0535, "step": 14169 }, { "epoch": 0.43, "learning_rate": 3.203937770614722e-06, "loss": 1.163, "step": 14170 }, { "epoch": 0.43, "learning_rate": 3.2037037164188246e-06, "loss": 1.1348, "step": 14171 }, { "epoch": 0.43, "learning_rate": 3.203469655524005e-06, "loss": 1.2054, "step": 14172 }, { "epoch": 0.43, "learning_rate": 3.2032355879324945e-06, "loss": 1.1327, "step": 14173 }, { "epoch": 0.43, "learning_rate": 3.203001513646519e-06, "loss": 1.1185, "step": 14174 }, { "epoch": 0.43, "learning_rate": 3.202767432668309e-06, "loss": 1.1311, "step": 14175 }, { "epoch": 0.43, "learning_rate": 3.20253334500009e-06, "loss": 1.076, "step": 14176 }, { "epoch": 0.43, "learning_rate": 3.202299250644093e-06, "loss": 1.0887, "step": 14177 }, { "epoch": 0.43, "learning_rate": 3.2020651496025444e-06, "loss": 1.0871, "step": 14178 }, { "epoch": 0.43, "learning_rate": 3.201831041877674e-06, "loss": 1.1032, "step": 14179 }, { "epoch": 0.43, "learning_rate": 3.2015969274717113e-06, "loss": 1.2263, "step": 14180 }, { "epoch": 0.43, "learning_rate": 3.201362806386883e-06, "loss": 1.0435, "step": 14181 }, { "epoch": 0.43, "learning_rate": 3.201128678625418e-06, "loss": 1.0607, "step": 14182 }, { "epoch": 0.43, "learning_rate": 3.2008945441895463e-06, "loss": 1.1316, "step": 14183 }, { "epoch": 0.43, "learning_rate": 3.2006604030814957e-06, "loss": 1.0912, "step": 14184 }, { "epoch": 0.43, "learning_rate": 3.200426255303496e-06, "loss": 1.0804, "step": 14185 }, { "epoch": 0.43, "learning_rate": 3.200192100857775e-06, "loss": 1.1288, "step": 14186 }, { "epoch": 0.43, "learning_rate": 3.1999579397465624e-06, "loss": 1.2278, "step": 14187 }, { "epoch": 0.43, "learning_rate": 3.199723771972088e-06, "loss": 1.2405, "step": 14188 }, { "epoch": 0.43, "learning_rate": 3.1994895975365796e-06, "loss": 1.1688, "step": 14189 }, { "epoch": 0.43, "learning_rate": 3.1992554164422686e-06, "loss": 1.1512, "step": 14190 }, { "epoch": 0.43, "learning_rate": 3.1990212286913815e-06, "loss": 1.0823, "step": 14191 }, { "epoch": 0.43, "learning_rate": 3.1987870342861484e-06, "loss": 1.1111, "step": 14192 }, { "epoch": 0.43, "learning_rate": 3.1985528332288006e-06, "loss": 1.2104, "step": 14193 }, { "epoch": 0.43, "learning_rate": 3.1983186255215653e-06, "loss": 1.213, "step": 14194 }, { "epoch": 0.43, "learning_rate": 3.198084411166674e-06, "loss": 1.038, "step": 14195 }, { "epoch": 0.43, "learning_rate": 3.1978501901663546e-06, "loss": 1.0996, "step": 14196 }, { "epoch": 0.43, "learning_rate": 3.1976159625228376e-06, "loss": 0.9658, "step": 14197 }, { "epoch": 0.43, "learning_rate": 3.1973817282383524e-06, "loss": 1.1104, "step": 14198 }, { "epoch": 0.43, "learning_rate": 3.19714748731513e-06, "loss": 1.1414, "step": 14199 }, { "epoch": 0.43, "learning_rate": 3.196913239755398e-06, "loss": 1.0386, "step": 14200 }, { "epoch": 0.43, "learning_rate": 3.1966789855613877e-06, "loss": 1.1166, "step": 14201 }, { "epoch": 0.43, "learning_rate": 3.1964447247353297e-06, "loss": 1.0743, "step": 14202 }, { "epoch": 0.43, "learning_rate": 3.1962104572794532e-06, "loss": 1.0854, "step": 14203 }, { "epoch": 0.43, "learning_rate": 3.195976183195988e-06, "loss": 1.1428, "step": 14204 }, { "epoch": 0.43, "learning_rate": 3.1957419024871654e-06, "loss": 1.124, "step": 14205 }, { "epoch": 0.43, "learning_rate": 3.1955076151552145e-06, "loss": 1.1285, "step": 14206 }, { "epoch": 0.43, "learning_rate": 3.195273321202366e-06, "loss": 1.233, "step": 14207 }, { "epoch": 0.43, "learning_rate": 3.195039020630851e-06, "loss": 1.1855, "step": 14208 }, { "epoch": 0.43, "learning_rate": 3.1948047134428982e-06, "loss": 1.1044, "step": 14209 }, { "epoch": 0.43, "learning_rate": 3.194570399640741e-06, "loss": 1.2596, "step": 14210 }, { "epoch": 0.43, "learning_rate": 3.194336079226606e-06, "loss": 1.2147, "step": 14211 }, { "epoch": 0.43, "learning_rate": 3.1941017522027272e-06, "loss": 1.0565, "step": 14212 }, { "epoch": 0.43, "learning_rate": 3.1938674185713337e-06, "loss": 1.2635, "step": 14213 }, { "epoch": 0.43, "learning_rate": 3.1936330783346557e-06, "loss": 1.1415, "step": 14214 }, { "epoch": 0.43, "learning_rate": 3.1933987314949255e-06, "loss": 1.1327, "step": 14215 }, { "epoch": 0.43, "learning_rate": 3.1931643780543744e-06, "loss": 1.1044, "step": 14216 }, { "epoch": 0.43, "learning_rate": 3.1929300180152307e-06, "loss": 1.0764, "step": 14217 }, { "epoch": 0.43, "learning_rate": 3.192695651379728e-06, "loss": 1.1461, "step": 14218 }, { "epoch": 0.43, "learning_rate": 3.192461278150096e-06, "loss": 1.2135, "step": 14219 }, { "epoch": 0.43, "learning_rate": 3.1922268983285654e-06, "loss": 1.0907, "step": 14220 }, { "epoch": 0.43, "learning_rate": 3.191992511917369e-06, "loss": 1.1049, "step": 14221 }, { "epoch": 0.43, "learning_rate": 3.191758118918737e-06, "loss": 1.1227, "step": 14222 }, { "epoch": 0.43, "learning_rate": 3.1915237193349008e-06, "loss": 1.1851, "step": 14223 }, { "epoch": 0.43, "learning_rate": 3.1912893131680915e-06, "loss": 1.0811, "step": 14224 }, { "epoch": 0.43, "learning_rate": 3.1910549004205414e-06, "loss": 1.0394, "step": 14225 }, { "epoch": 0.43, "learning_rate": 3.190820481094481e-06, "loss": 1.0657, "step": 14226 }, { "epoch": 0.43, "learning_rate": 3.1905860551921426e-06, "loss": 1.1124, "step": 14227 }, { "epoch": 0.43, "learning_rate": 3.1903516227157573e-06, "loss": 1.1346, "step": 14228 }, { "epoch": 0.43, "learning_rate": 3.1901171836675576e-06, "loss": 1.2043, "step": 14229 }, { "epoch": 0.43, "learning_rate": 3.189882738049774e-06, "loss": 1.1508, "step": 14230 }, { "epoch": 0.43, "learning_rate": 3.18964828586464e-06, "loss": 1.1013, "step": 14231 }, { "epoch": 0.43, "learning_rate": 3.1894138271143852e-06, "loss": 1.0662, "step": 14232 }, { "epoch": 0.43, "learning_rate": 3.1891793618012435e-06, "loss": 1.1658, "step": 14233 }, { "epoch": 0.43, "learning_rate": 3.1889448899274466e-06, "loss": 1.1615, "step": 14234 }, { "epoch": 0.43, "learning_rate": 3.188710411495225e-06, "loss": 1.1505, "step": 14235 }, { "epoch": 0.43, "learning_rate": 3.1884759265068134e-06, "loss": 1.1528, "step": 14236 }, { "epoch": 0.43, "learning_rate": 3.1882414349644414e-06, "loss": 1.144, "step": 14237 }, { "epoch": 0.43, "learning_rate": 3.1880069368703433e-06, "loss": 1.2612, "step": 14238 }, { "epoch": 0.43, "learning_rate": 3.1877724322267496e-06, "loss": 1.175, "step": 14239 }, { "epoch": 0.43, "learning_rate": 3.187537921035894e-06, "loss": 1.0212, "step": 14240 }, { "epoch": 0.43, "learning_rate": 3.187303403300009e-06, "loss": 1.0782, "step": 14241 }, { "epoch": 0.43, "learning_rate": 3.1870688790213256e-06, "loss": 1.1885, "step": 14242 }, { "epoch": 0.43, "learning_rate": 3.186834348202078e-06, "loss": 1.0489, "step": 14243 }, { "epoch": 0.43, "learning_rate": 3.1865998108444983e-06, "loss": 1.0397, "step": 14244 }, { "epoch": 0.43, "learning_rate": 3.1863652669508183e-06, "loss": 1.202, "step": 14245 }, { "epoch": 0.43, "learning_rate": 3.1861307165232723e-06, "loss": 1.1162, "step": 14246 }, { "epoch": 0.43, "learning_rate": 3.1858961595640926e-06, "loss": 1.1177, "step": 14247 }, { "epoch": 0.43, "learning_rate": 3.185661596075511e-06, "loss": 1.2059, "step": 14248 }, { "epoch": 0.43, "learning_rate": 3.185427026059762e-06, "loss": 1.2133, "step": 14249 }, { "epoch": 0.43, "learning_rate": 3.185192449519077e-06, "loss": 1.0421, "step": 14250 }, { "epoch": 0.43, "learning_rate": 3.184957866455691e-06, "loss": 1.2275, "step": 14251 }, { "epoch": 0.43, "learning_rate": 3.184723276871835e-06, "loss": 1.192, "step": 14252 }, { "epoch": 0.43, "learning_rate": 3.1844886807697435e-06, "loss": 1.1912, "step": 14253 }, { "epoch": 0.43, "learning_rate": 3.1842540781516496e-06, "loss": 1.2529, "step": 14254 }, { "epoch": 0.43, "learning_rate": 3.1840194690197856e-06, "loss": 1.079, "step": 14255 }, { "epoch": 0.43, "learning_rate": 3.1837848533763858e-06, "loss": 1.182, "step": 14256 }, { "epoch": 0.43, "learning_rate": 3.1835502312236843e-06, "loss": 1.1383, "step": 14257 }, { "epoch": 0.43, "learning_rate": 3.183315602563913e-06, "loss": 1.1676, "step": 14258 }, { "epoch": 0.43, "learning_rate": 3.1830809673993076e-06, "loss": 1.1171, "step": 14259 }, { "epoch": 0.43, "learning_rate": 3.1828463257320995e-06, "loss": 1.0577, "step": 14260 }, { "epoch": 0.43, "learning_rate": 3.1826116775645235e-06, "loss": 1.0831, "step": 14261 }, { "epoch": 0.43, "learning_rate": 3.1823770228988126e-06, "loss": 1.1395, "step": 14262 }, { "epoch": 0.43, "learning_rate": 3.1821423617372014e-06, "loss": 1.1611, "step": 14263 }, { "epoch": 0.43, "learning_rate": 3.181907694081924e-06, "loss": 1.1998, "step": 14264 }, { "epoch": 0.43, "learning_rate": 3.181673019935213e-06, "loss": 1.0291, "step": 14265 }, { "epoch": 0.43, "learning_rate": 3.1814383392993033e-06, "loss": 1.1189, "step": 14266 }, { "epoch": 0.43, "learning_rate": 3.1812036521764287e-06, "loss": 1.1568, "step": 14267 }, { "epoch": 0.43, "learning_rate": 3.1809689585688237e-06, "loss": 1.1324, "step": 14268 }, { "epoch": 0.43, "learning_rate": 3.1807342584787217e-06, "loss": 1.1587, "step": 14269 }, { "epoch": 0.43, "learning_rate": 3.180499551908358e-06, "loss": 1.1293, "step": 14270 }, { "epoch": 0.43, "learning_rate": 3.1802648388599654e-06, "loss": 1.0603, "step": 14271 }, { "epoch": 0.43, "learning_rate": 3.18003011933578e-06, "loss": 1.0816, "step": 14272 }, { "epoch": 0.43, "learning_rate": 3.1797953933380353e-06, "loss": 1.2656, "step": 14273 }, { "epoch": 0.43, "learning_rate": 3.1795606608689656e-06, "loss": 1.1287, "step": 14274 }, { "epoch": 0.43, "learning_rate": 3.1793259219308063e-06, "loss": 1.1922, "step": 14275 }, { "epoch": 0.43, "learning_rate": 3.179091176525791e-06, "loss": 1.224, "step": 14276 }, { "epoch": 0.43, "learning_rate": 3.178856424656155e-06, "loss": 1.037, "step": 14277 }, { "epoch": 0.43, "learning_rate": 3.178621666324132e-06, "loss": 1.0845, "step": 14278 }, { "epoch": 0.43, "learning_rate": 3.1783869015319585e-06, "loss": 1.0598, "step": 14279 }, { "epoch": 0.43, "learning_rate": 3.178152130281868e-06, "loss": 1.1467, "step": 14280 }, { "epoch": 0.43, "learning_rate": 3.177917352576096e-06, "loss": 1.3311, "step": 14281 }, { "epoch": 0.43, "learning_rate": 3.1776825684168765e-06, "loss": 1.0363, "step": 14282 }, { "epoch": 0.43, "learning_rate": 3.177447777806446e-06, "loss": 1.183, "step": 14283 }, { "epoch": 0.43, "learning_rate": 3.1772129807470385e-06, "loss": 1.0611, "step": 14284 }, { "epoch": 0.43, "learning_rate": 3.1769781772408904e-06, "loss": 1.064, "step": 14285 }, { "epoch": 0.43, "learning_rate": 3.1767433672902357e-06, "loss": 1.2284, "step": 14286 }, { "epoch": 0.43, "learning_rate": 3.1765085508973097e-06, "loss": 1.2101, "step": 14287 }, { "epoch": 0.43, "learning_rate": 3.1762737280643486e-06, "loss": 1.1503, "step": 14288 }, { "epoch": 0.43, "learning_rate": 3.1760388987935873e-06, "loss": 1.1031, "step": 14289 }, { "epoch": 0.43, "learning_rate": 3.175804063087261e-06, "loss": 1.1768, "step": 14290 }, { "epoch": 0.43, "learning_rate": 3.1755692209476057e-06, "loss": 1.1407, "step": 14291 }, { "epoch": 0.43, "learning_rate": 3.175334372376857e-06, "loss": 1.2388, "step": 14292 }, { "epoch": 0.43, "learning_rate": 3.1750995173772496e-06, "loss": 1.1313, "step": 14293 }, { "epoch": 0.43, "learning_rate": 3.174864655951021e-06, "loss": 0.96, "step": 14294 }, { "epoch": 0.43, "learning_rate": 3.1746297881004053e-06, "loss": 1.0863, "step": 14295 }, { "epoch": 0.43, "learning_rate": 3.1743949138276386e-06, "loss": 1.1971, "step": 14296 }, { "epoch": 0.43, "learning_rate": 3.174160033134957e-06, "loss": 1.0446, "step": 14297 }, { "epoch": 0.43, "learning_rate": 3.173925146024597e-06, "loss": 1.2078, "step": 14298 }, { "epoch": 0.43, "learning_rate": 3.1736902524987944e-06, "loss": 1.0853, "step": 14299 }, { "epoch": 0.43, "learning_rate": 3.1734553525597846e-06, "loss": 1.1902, "step": 14300 }, { "epoch": 0.43, "learning_rate": 3.1732204462098048e-06, "loss": 1.1483, "step": 14301 }, { "epoch": 0.43, "learning_rate": 3.1729855334510902e-06, "loss": 1.0953, "step": 14302 }, { "epoch": 0.43, "learning_rate": 3.1727506142858776e-06, "loss": 1.0953, "step": 14303 }, { "epoch": 0.43, "learning_rate": 3.1725156887164025e-06, "loss": 1.2421, "step": 14304 }, { "epoch": 0.43, "learning_rate": 3.1722807567449034e-06, "loss": 1.0815, "step": 14305 }, { "epoch": 0.43, "learning_rate": 3.172045818373614e-06, "loss": 1.123, "step": 14306 }, { "epoch": 0.43, "learning_rate": 3.1718108736047724e-06, "loss": 1.0878, "step": 14307 }, { "epoch": 0.43, "learning_rate": 3.1715759224406146e-06, "loss": 1.1474, "step": 14308 }, { "epoch": 0.43, "learning_rate": 3.1713409648833774e-06, "loss": 1.0892, "step": 14309 }, { "epoch": 0.43, "learning_rate": 3.1711060009352978e-06, "loss": 1.0889, "step": 14310 }, { "epoch": 0.43, "learning_rate": 3.1708710305986123e-06, "loss": 1.1325, "step": 14311 }, { "epoch": 0.43, "learning_rate": 3.1706360538755576e-06, "loss": 1.3138, "step": 14312 }, { "epoch": 0.43, "learning_rate": 3.1704010707683707e-06, "loss": 1.1084, "step": 14313 }, { "epoch": 0.43, "learning_rate": 3.170166081279289e-06, "loss": 1.147, "step": 14314 }, { "epoch": 0.43, "learning_rate": 3.169931085410548e-06, "loss": 1.1439, "step": 14315 }, { "epoch": 0.43, "learning_rate": 3.169696083164387e-06, "loss": 1.0834, "step": 14316 }, { "epoch": 0.43, "learning_rate": 3.169461074543041e-06, "loss": 1.1978, "step": 14317 }, { "epoch": 0.43, "learning_rate": 3.1692260595487485e-06, "loss": 1.0435, "step": 14318 }, { "epoch": 0.43, "learning_rate": 3.168991038183745e-06, "loss": 1.1926, "step": 14319 }, { "epoch": 0.43, "learning_rate": 3.16875601045027e-06, "loss": 1.1105, "step": 14320 }, { "epoch": 0.43, "learning_rate": 3.16852097635056e-06, "loss": 1.1488, "step": 14321 }, { "epoch": 0.43, "learning_rate": 3.168285935886852e-06, "loss": 1.1268, "step": 14322 }, { "epoch": 0.43, "learning_rate": 3.168050889061384e-06, "loss": 1.1301, "step": 14323 }, { "epoch": 0.43, "learning_rate": 3.1678158358763923e-06, "loss": 1.1893, "step": 14324 }, { "epoch": 0.43, "learning_rate": 3.167580776334116e-06, "loss": 1.0839, "step": 14325 }, { "epoch": 0.43, "learning_rate": 3.167345710436792e-06, "loss": 1.1366, "step": 14326 }, { "epoch": 0.43, "learning_rate": 3.167110638186659e-06, "loss": 1.0533, "step": 14327 }, { "epoch": 0.43, "learning_rate": 3.1668755595859533e-06, "loss": 1.128, "step": 14328 }, { "epoch": 0.43, "learning_rate": 3.1666404746369145e-06, "loss": 1.1093, "step": 14329 }, { "epoch": 0.43, "learning_rate": 3.1664053833417787e-06, "loss": 1.0778, "step": 14330 }, { "epoch": 0.43, "learning_rate": 3.166170285702785e-06, "loss": 1.1433, "step": 14331 }, { "epoch": 0.43, "learning_rate": 3.16593518172217e-06, "loss": 1.1106, "step": 14332 }, { "epoch": 0.43, "learning_rate": 3.165700071402174e-06, "loss": 1.2061, "step": 14333 }, { "epoch": 0.43, "learning_rate": 3.1654649547450334e-06, "loss": 1.0534, "step": 14334 }, { "epoch": 0.43, "learning_rate": 3.1652298317529866e-06, "loss": 1.1005, "step": 14335 }, { "epoch": 0.43, "learning_rate": 3.1649947024282724e-06, "loss": 1.1218, "step": 14336 }, { "epoch": 0.43, "learning_rate": 3.164759566773129e-06, "loss": 1.1956, "step": 14337 }, { "epoch": 0.43, "learning_rate": 3.1645244247897943e-06, "loss": 1.2141, "step": 14338 }, { "epoch": 0.43, "learning_rate": 3.164289276480508e-06, "loss": 1.1264, "step": 14339 }, { "epoch": 0.43, "learning_rate": 3.1640541218475067e-06, "loss": 1.1403, "step": 14340 }, { "epoch": 0.43, "learning_rate": 3.1638189608930305e-06, "loss": 1.1472, "step": 14341 }, { "epoch": 0.43, "learning_rate": 3.163583793619318e-06, "loss": 1.1417, "step": 14342 }, { "epoch": 0.43, "learning_rate": 3.163348620028607e-06, "loss": 1.0895, "step": 14343 }, { "epoch": 0.43, "learning_rate": 3.163113440123137e-06, "loss": 1.1734, "step": 14344 }, { "epoch": 0.43, "learning_rate": 3.162878253905145e-06, "loss": 1.1373, "step": 14345 }, { "epoch": 0.43, "learning_rate": 3.1626430613768727e-06, "loss": 1.142, "step": 14346 }, { "epoch": 0.43, "learning_rate": 3.162407862540557e-06, "loss": 1.1398, "step": 14347 }, { "epoch": 0.43, "learning_rate": 3.1621726573984377e-06, "loss": 1.0858, "step": 14348 }, { "epoch": 0.43, "learning_rate": 3.161937445952753e-06, "loss": 1.2024, "step": 14349 }, { "epoch": 0.43, "learning_rate": 3.1617022282057432e-06, "loss": 1.141, "step": 14350 }, { "epoch": 0.43, "learning_rate": 3.161467004159646e-06, "loss": 1.1712, "step": 14351 }, { "epoch": 0.43, "learning_rate": 3.161231773816703e-06, "loss": 1.1074, "step": 14352 }, { "epoch": 0.43, "learning_rate": 3.160996537179151e-06, "loss": 1.1931, "step": 14353 }, { "epoch": 0.43, "learning_rate": 3.1607612942492304e-06, "loss": 1.0492, "step": 14354 }, { "epoch": 0.43, "learning_rate": 3.1605260450291807e-06, "loss": 1.1151, "step": 14355 }, { "epoch": 0.43, "learning_rate": 3.1602907895212416e-06, "loss": 1.1874, "step": 14356 }, { "epoch": 0.43, "learning_rate": 3.160055527727652e-06, "loss": 1.1711, "step": 14357 }, { "epoch": 0.43, "learning_rate": 3.159820259650651e-06, "loss": 1.0461, "step": 14358 }, { "epoch": 0.43, "learning_rate": 3.15958498529248e-06, "loss": 1.1038, "step": 14359 }, { "epoch": 0.43, "learning_rate": 3.1593497046553764e-06, "loss": 1.1924, "step": 14360 }, { "epoch": 0.43, "learning_rate": 3.1591144177415816e-06, "loss": 1.09, "step": 14361 }, { "epoch": 0.43, "learning_rate": 3.1588791245533353e-06, "loss": 1.0879, "step": 14362 }, { "epoch": 0.43, "learning_rate": 3.158643825092877e-06, "loss": 1.1073, "step": 14363 }, { "epoch": 0.43, "learning_rate": 3.1584085193624465e-06, "loss": 1.1832, "step": 14364 }, { "epoch": 0.43, "learning_rate": 3.1581732073642835e-06, "loss": 1.0629, "step": 14365 }, { "epoch": 0.43, "learning_rate": 3.157937889100629e-06, "loss": 1.0844, "step": 14366 }, { "epoch": 0.43, "learning_rate": 3.1577025645737224e-06, "loss": 1.0399, "step": 14367 }, { "epoch": 0.43, "learning_rate": 3.1574672337858046e-06, "loss": 0.9993, "step": 14368 }, { "epoch": 0.43, "learning_rate": 3.157231896739115e-06, "loss": 1.1487, "step": 14369 }, { "epoch": 0.43, "learning_rate": 3.1569965534358947e-06, "loss": 1.0917, "step": 14370 }, { "epoch": 0.43, "learning_rate": 3.1567612038783833e-06, "loss": 1.1279, "step": 14371 }, { "epoch": 0.43, "learning_rate": 3.1565258480688226e-06, "loss": 1.1832, "step": 14372 }, { "epoch": 0.43, "learning_rate": 3.1562904860094505e-06, "loss": 1.2256, "step": 14373 }, { "epoch": 0.43, "learning_rate": 3.15605511770251e-06, "loss": 1.1868, "step": 14374 }, { "epoch": 0.43, "learning_rate": 3.15581974315024e-06, "loss": 1.173, "step": 14375 }, { "epoch": 0.43, "learning_rate": 3.1555843623548832e-06, "loss": 1.1124, "step": 14376 }, { "epoch": 0.43, "learning_rate": 3.155348975318678e-06, "loss": 1.1252, "step": 14377 }, { "epoch": 0.43, "learning_rate": 3.155113582043866e-06, "loss": 1.0481, "step": 14378 }, { "epoch": 0.43, "learning_rate": 3.1548781825326883e-06, "loss": 1.0143, "step": 14379 }, { "epoch": 0.43, "learning_rate": 3.1546427767873853e-06, "loss": 1.0847, "step": 14380 }, { "epoch": 0.43, "learning_rate": 3.1544073648101996e-06, "loss": 1.1938, "step": 14381 }, { "epoch": 0.43, "learning_rate": 3.1541719466033703e-06, "loss": 1.0781, "step": 14382 }, { "epoch": 0.43, "learning_rate": 3.15393652216914e-06, "loss": 1.1156, "step": 14383 }, { "epoch": 0.43, "learning_rate": 3.1537010915097476e-06, "loss": 1.1113, "step": 14384 }, { "epoch": 0.43, "learning_rate": 3.153465654627437e-06, "loss": 1.1991, "step": 14385 }, { "epoch": 0.43, "learning_rate": 3.153230211524446e-06, "loss": 1.1505, "step": 14386 }, { "epoch": 0.43, "learning_rate": 3.15299476220302e-06, "loss": 1.1301, "step": 14387 }, { "epoch": 0.43, "learning_rate": 3.152759306665397e-06, "loss": 1.1145, "step": 14388 }, { "epoch": 0.43, "learning_rate": 3.152523844913821e-06, "loss": 1.0922, "step": 14389 }, { "epoch": 0.43, "learning_rate": 3.152288376950532e-06, "loss": 1.1157, "step": 14390 }, { "epoch": 0.43, "learning_rate": 3.152052902777771e-06, "loss": 1.1964, "step": 14391 }, { "epoch": 0.43, "learning_rate": 3.1518174223977806e-06, "loss": 1.1171, "step": 14392 }, { "epoch": 0.43, "learning_rate": 3.1515819358128025e-06, "loss": 1.2173, "step": 14393 }, { "epoch": 0.43, "learning_rate": 3.1513464430250783e-06, "loss": 1.1213, "step": 14394 }, { "epoch": 0.43, "learning_rate": 3.1511109440368494e-06, "loss": 1.1759, "step": 14395 }, { "epoch": 0.43, "learning_rate": 3.1508754388503582e-06, "loss": 1.1537, "step": 14396 }, { "epoch": 0.43, "learning_rate": 3.150639927467846e-06, "loss": 1.0739, "step": 14397 }, { "epoch": 0.43, "learning_rate": 3.150404409891556e-06, "loss": 1.1823, "step": 14398 }, { "epoch": 0.43, "learning_rate": 3.1501688861237277e-06, "loss": 1.1112, "step": 14399 }, { "epoch": 0.43, "learning_rate": 3.1499333561666063e-06, "loss": 1.0705, "step": 14400 }, { "epoch": 0.43, "learning_rate": 3.1496978200224314e-06, "loss": 1.2056, "step": 14401 }, { "epoch": 0.43, "learning_rate": 3.1494622776934463e-06, "loss": 1.1326, "step": 14402 }, { "epoch": 0.43, "learning_rate": 3.1492267291818933e-06, "loss": 1.0812, "step": 14403 }, { "epoch": 0.43, "learning_rate": 3.1489911744900143e-06, "loss": 1.2069, "step": 14404 }, { "epoch": 0.43, "learning_rate": 3.148755613620052e-06, "loss": 1.01, "step": 14405 }, { "epoch": 0.43, "learning_rate": 3.148520046574248e-06, "loss": 1.221, "step": 14406 }, { "epoch": 0.43, "learning_rate": 3.148284473354847e-06, "loss": 1.0806, "step": 14407 }, { "epoch": 0.43, "learning_rate": 3.1480488939640886e-06, "loss": 1.1223, "step": 14408 }, { "epoch": 0.43, "learning_rate": 3.1478133084042174e-06, "loss": 1.0939, "step": 14409 }, { "epoch": 0.43, "learning_rate": 3.147577716677476e-06, "loss": 1.102, "step": 14410 }, { "epoch": 0.43, "learning_rate": 3.147342118786106e-06, "loss": 1.1076, "step": 14411 }, { "epoch": 0.43, "learning_rate": 3.147106514732351e-06, "loss": 1.2448, "step": 14412 }, { "epoch": 0.43, "learning_rate": 3.146870904518454e-06, "loss": 1.1972, "step": 14413 }, { "epoch": 0.43, "learning_rate": 3.1466352881466567e-06, "loss": 1.0884, "step": 14414 }, { "epoch": 0.43, "learning_rate": 3.1463996656192035e-06, "loss": 1.0731, "step": 14415 }, { "epoch": 0.43, "learning_rate": 3.1461640369383364e-06, "loss": 1.0809, "step": 14416 }, { "epoch": 0.43, "learning_rate": 3.1459284021063e-06, "loss": 1.1712, "step": 14417 }, { "epoch": 0.43, "learning_rate": 3.1456927611253347e-06, "loss": 1.0017, "step": 14418 }, { "epoch": 0.43, "learning_rate": 3.1454571139976858e-06, "loss": 0.9836, "step": 14419 }, { "epoch": 0.43, "learning_rate": 3.145221460725596e-06, "loss": 1.1105, "step": 14420 }, { "epoch": 0.43, "learning_rate": 3.1449858013113088e-06, "loss": 1.136, "step": 14421 }, { "epoch": 0.43, "learning_rate": 3.1447501357570675e-06, "loss": 1.0542, "step": 14422 }, { "epoch": 0.43, "learning_rate": 3.1445144640651153e-06, "loss": 1.1989, "step": 14423 }, { "epoch": 0.43, "learning_rate": 3.144278786237696e-06, "loss": 1.0706, "step": 14424 }, { "epoch": 0.43, "learning_rate": 3.1440431022770528e-06, "loss": 1.0541, "step": 14425 }, { "epoch": 0.43, "learning_rate": 3.14380741218543e-06, "loss": 1.0825, "step": 14426 }, { "epoch": 0.43, "learning_rate": 3.1435717159650702e-06, "loss": 1.1797, "step": 14427 }, { "epoch": 0.43, "learning_rate": 3.1433360136182177e-06, "loss": 1.0937, "step": 14428 }, { "epoch": 0.43, "learning_rate": 3.143100305147116e-06, "loss": 1.2047, "step": 14429 }, { "epoch": 0.43, "learning_rate": 3.1428645905540096e-06, "loss": 1.2203, "step": 14430 }, { "epoch": 0.43, "learning_rate": 3.142628869841141e-06, "loss": 1.0893, "step": 14431 }, { "epoch": 0.43, "learning_rate": 3.1423931430107556e-06, "loss": 1.1216, "step": 14432 }, { "epoch": 0.43, "learning_rate": 3.1421574100650966e-06, "loss": 1.187, "step": 14433 }, { "epoch": 0.43, "learning_rate": 3.141921671006408e-06, "loss": 1.1332, "step": 14434 }, { "epoch": 0.43, "learning_rate": 3.141685925836936e-06, "loss": 1.0444, "step": 14435 }, { "epoch": 0.43, "learning_rate": 3.1414501745589217e-06, "loss": 1.1168, "step": 14436 }, { "epoch": 0.43, "learning_rate": 3.1412144171746105e-06, "loss": 1.1851, "step": 14437 }, { "epoch": 0.43, "learning_rate": 3.1409786536862475e-06, "loss": 1.2495, "step": 14438 }, { "epoch": 0.43, "learning_rate": 3.1407428840960764e-06, "loss": 1.1439, "step": 14439 }, { "epoch": 0.44, "learning_rate": 3.140507108406341e-06, "loss": 1.0628, "step": 14440 }, { "epoch": 0.44, "learning_rate": 3.1402713266192876e-06, "loss": 1.0966, "step": 14441 }, { "epoch": 0.44, "learning_rate": 3.1400355387371583e-06, "loss": 1.137, "step": 14442 }, { "epoch": 0.44, "learning_rate": 3.1397997447621995e-06, "loss": 1.2222, "step": 14443 }, { "epoch": 0.44, "learning_rate": 3.1395639446966554e-06, "loss": 1.1062, "step": 14444 }, { "epoch": 0.44, "learning_rate": 3.1393281385427698e-06, "loss": 1.223, "step": 14445 }, { "epoch": 0.44, "learning_rate": 3.139092326302789e-06, "loss": 0.9894, "step": 14446 }, { "epoch": 0.44, "learning_rate": 3.1388565079789567e-06, "loss": 1.1459, "step": 14447 }, { "epoch": 0.44, "learning_rate": 3.1386206835735176e-06, "loss": 1.0623, "step": 14448 }, { "epoch": 0.44, "learning_rate": 3.1383848530887177e-06, "loss": 1.1663, "step": 14449 }, { "epoch": 0.44, "learning_rate": 3.138149016526802e-06, "loss": 1.2413, "step": 14450 }, { "epoch": 0.44, "learning_rate": 3.1379131738900142e-06, "loss": 1.0649, "step": 14451 }, { "epoch": 0.44, "learning_rate": 3.1376773251806012e-06, "loss": 1.0795, "step": 14452 }, { "epoch": 0.44, "learning_rate": 3.137441470400806e-06, "loss": 1.1153, "step": 14453 }, { "epoch": 0.44, "learning_rate": 3.137205609552876e-06, "loss": 1.1333, "step": 14454 }, { "epoch": 0.44, "learning_rate": 3.136969742639055e-06, "loss": 1.1064, "step": 14455 }, { "epoch": 0.44, "learning_rate": 3.136733869661589e-06, "loss": 1.0643, "step": 14456 }, { "epoch": 0.44, "learning_rate": 3.1364979906227226e-06, "loss": 1.0916, "step": 14457 }, { "epoch": 0.44, "learning_rate": 3.136262105524702e-06, "loss": 1.1248, "step": 14458 }, { "epoch": 0.44, "learning_rate": 3.136026214369774e-06, "loss": 1.0629, "step": 14459 }, { "epoch": 0.44, "learning_rate": 3.135790317160181e-06, "loss": 1.1334, "step": 14460 }, { "epoch": 0.44, "learning_rate": 3.1355544138981707e-06, "loss": 1.1006, "step": 14461 }, { "epoch": 0.44, "learning_rate": 3.135318504585989e-06, "loss": 1.1219, "step": 14462 }, { "epoch": 0.44, "learning_rate": 3.1350825892258814e-06, "loss": 1.2203, "step": 14463 }, { "epoch": 0.44, "learning_rate": 3.1348466678200927e-06, "loss": 1.1047, "step": 14464 }, { "epoch": 0.44, "learning_rate": 3.1346107403708704e-06, "loss": 1.131, "step": 14465 }, { "epoch": 0.44, "learning_rate": 3.134374806880458e-06, "loss": 1.1085, "step": 14466 }, { "epoch": 0.44, "learning_rate": 3.1341388673511043e-06, "loss": 0.975, "step": 14467 }, { "epoch": 0.44, "learning_rate": 3.1339029217850535e-06, "loss": 1.1403, "step": 14468 }, { "epoch": 0.44, "learning_rate": 3.1336669701845524e-06, "loss": 1.0977, "step": 14469 }, { "epoch": 0.44, "learning_rate": 3.1334310125518464e-06, "loss": 1.0947, "step": 14470 }, { "epoch": 0.44, "learning_rate": 3.1331950488891827e-06, "loss": 1.1147, "step": 14471 }, { "epoch": 0.44, "learning_rate": 3.1329590791988073e-06, "loss": 1.1459, "step": 14472 }, { "epoch": 0.44, "learning_rate": 3.1327231034829656e-06, "loss": 1.0631, "step": 14473 }, { "epoch": 0.44, "learning_rate": 3.1324871217439044e-06, "loss": 1.0477, "step": 14474 }, { "epoch": 0.44, "learning_rate": 3.1322511339838713e-06, "loss": 1.2692, "step": 14475 }, { "epoch": 0.44, "learning_rate": 3.1320151402051117e-06, "loss": 1.1641, "step": 14476 }, { "epoch": 0.44, "learning_rate": 3.1317791404098724e-06, "loss": 1.1495, "step": 14477 }, { "epoch": 0.44, "learning_rate": 3.1315431346004e-06, "loss": 1.1418, "step": 14478 }, { "epoch": 0.44, "learning_rate": 3.131307122778941e-06, "loss": 1.1943, "step": 14479 }, { "epoch": 0.44, "learning_rate": 3.131071104947743e-06, "loss": 1.1147, "step": 14480 }, { "epoch": 0.44, "learning_rate": 3.1308350811090502e-06, "loss": 1.1876, "step": 14481 }, { "epoch": 0.44, "learning_rate": 3.130599051265113e-06, "loss": 1.1552, "step": 14482 }, { "epoch": 0.44, "learning_rate": 3.130363015418176e-06, "loss": 0.9672, "step": 14483 }, { "epoch": 0.44, "learning_rate": 3.1301269735704867e-06, "loss": 1.1918, "step": 14484 }, { "epoch": 0.44, "learning_rate": 3.1298909257242914e-06, "loss": 1.1671, "step": 14485 }, { "epoch": 0.44, "learning_rate": 3.129654871881838e-06, "loss": 1.1631, "step": 14486 }, { "epoch": 0.44, "learning_rate": 3.1294188120453744e-06, "loss": 1.0991, "step": 14487 }, { "epoch": 0.44, "learning_rate": 3.1291827462171466e-06, "loss": 1.0798, "step": 14488 }, { "epoch": 0.44, "learning_rate": 3.1289466743994014e-06, "loss": 1.1703, "step": 14489 }, { "epoch": 0.44, "learning_rate": 3.1287105965943864e-06, "loss": 1.0104, "step": 14490 }, { "epoch": 0.44, "learning_rate": 3.12847451280435e-06, "loss": 1.1605, "step": 14491 }, { "epoch": 0.44, "learning_rate": 3.1282384230315394e-06, "loss": 1.1428, "step": 14492 }, { "epoch": 0.44, "learning_rate": 3.1280023272782012e-06, "loss": 1.125, "step": 14493 }, { "epoch": 0.44, "learning_rate": 3.1277662255465833e-06, "loss": 1.1482, "step": 14494 }, { "epoch": 0.44, "learning_rate": 3.127530117838934e-06, "loss": 1.1522, "step": 14495 }, { "epoch": 0.44, "learning_rate": 3.127294004157499e-06, "loss": 1.1309, "step": 14496 }, { "epoch": 0.44, "learning_rate": 3.1270578845045278e-06, "loss": 1.0038, "step": 14497 }, { "epoch": 0.44, "learning_rate": 3.1268217588822668e-06, "loss": 0.9516, "step": 14498 }, { "epoch": 0.44, "learning_rate": 3.1265856272929653e-06, "loss": 1.1858, "step": 14499 }, { "epoch": 0.44, "learning_rate": 3.126349489738871e-06, "loss": 1.1679, "step": 14500 }, { "epoch": 0.44, "learning_rate": 3.12611334622223e-06, "loss": 1.0595, "step": 14501 }, { "epoch": 0.44, "learning_rate": 3.1258771967452915e-06, "loss": 1.1105, "step": 14502 }, { "epoch": 0.44, "learning_rate": 3.125641041310304e-06, "loss": 1.07, "step": 14503 }, { "epoch": 0.44, "learning_rate": 3.1254048799195154e-06, "loss": 1.2601, "step": 14504 }, { "epoch": 0.44, "learning_rate": 3.125168712575173e-06, "loss": 1.1685, "step": 14505 }, { "epoch": 0.44, "learning_rate": 3.124932539279526e-06, "loss": 1.0782, "step": 14506 }, { "epoch": 0.44, "learning_rate": 3.124696360034822e-06, "loss": 1.1272, "step": 14507 }, { "epoch": 0.44, "learning_rate": 3.1244601748433095e-06, "loss": 1.1246, "step": 14508 }, { "epoch": 0.44, "learning_rate": 3.1242239837072365e-06, "loss": 1.052, "step": 14509 }, { "epoch": 0.44, "learning_rate": 3.1239877866288525e-06, "loss": 1.0645, "step": 14510 }, { "epoch": 0.44, "learning_rate": 3.123751583610405e-06, "loss": 1.1913, "step": 14511 }, { "epoch": 0.44, "learning_rate": 3.1235153746541423e-06, "loss": 1.0843, "step": 14512 }, { "epoch": 0.44, "learning_rate": 3.1232791597623145e-06, "loss": 1.1273, "step": 14513 }, { "epoch": 0.44, "learning_rate": 3.1230429389371684e-06, "loss": 1.1821, "step": 14514 }, { "epoch": 0.44, "learning_rate": 3.122806712180954e-06, "loss": 1.1693, "step": 14515 }, { "epoch": 0.44, "learning_rate": 3.1225704794959193e-06, "loss": 1.0835, "step": 14516 }, { "epoch": 0.44, "learning_rate": 3.1223342408843145e-06, "loss": 1.0511, "step": 14517 }, { "epoch": 0.44, "learning_rate": 3.1220979963483864e-06, "loss": 1.1731, "step": 14518 }, { "epoch": 0.44, "learning_rate": 3.1218617458903855e-06, "loss": 1.215, "step": 14519 }, { "epoch": 0.44, "learning_rate": 3.1216254895125603e-06, "loss": 1.1563, "step": 14520 }, { "epoch": 0.44, "learning_rate": 3.1213892272171596e-06, "loss": 1.0853, "step": 14521 }, { "epoch": 0.44, "learning_rate": 3.121152959006433e-06, "loss": 1.0331, "step": 14522 }, { "epoch": 0.44, "learning_rate": 3.1209166848826295e-06, "loss": 1.2539, "step": 14523 }, { "epoch": 0.44, "learning_rate": 3.120680404847998e-06, "loss": 0.9869, "step": 14524 }, { "epoch": 0.44, "learning_rate": 3.1204441189047874e-06, "loss": 1.2009, "step": 14525 }, { "epoch": 0.44, "learning_rate": 3.1202078270552485e-06, "loss": 1.1547, "step": 14526 }, { "epoch": 0.44, "learning_rate": 3.119971529301629e-06, "loss": 1.2014, "step": 14527 }, { "epoch": 0.44, "learning_rate": 3.11973522564618e-06, "loss": 1.1063, "step": 14528 }, { "epoch": 0.44, "learning_rate": 3.1194989160911495e-06, "loss": 1.057, "step": 14529 }, { "epoch": 0.44, "learning_rate": 3.119262600638787e-06, "loss": 1.1677, "step": 14530 }, { "epoch": 0.44, "learning_rate": 3.119026279291344e-06, "loss": 1.1782, "step": 14531 }, { "epoch": 0.44, "learning_rate": 3.1187899520510685e-06, "loss": 1.1346, "step": 14532 }, { "epoch": 0.44, "learning_rate": 3.1185536189202104e-06, "loss": 1.0784, "step": 14533 }, { "epoch": 0.44, "learning_rate": 3.1183172799010207e-06, "loss": 1.0934, "step": 14534 }, { "epoch": 0.44, "learning_rate": 3.1180809349957473e-06, "loss": 1.1409, "step": 14535 }, { "epoch": 0.44, "learning_rate": 3.1178445842066417e-06, "loss": 1.2029, "step": 14536 }, { "epoch": 0.44, "learning_rate": 3.117608227535953e-06, "loss": 1.2406, "step": 14537 }, { "epoch": 0.44, "learning_rate": 3.1173718649859307e-06, "loss": 1.0963, "step": 14538 }, { "epoch": 0.44, "learning_rate": 3.117135496558827e-06, "loss": 1.0762, "step": 14539 }, { "epoch": 0.44, "learning_rate": 3.1168991222568896e-06, "loss": 1.1332, "step": 14540 }, { "epoch": 0.44, "learning_rate": 3.1166627420823705e-06, "loss": 0.9948, "step": 14541 }, { "epoch": 0.44, "learning_rate": 3.116426356037518e-06, "loss": 1.1776, "step": 14542 }, { "epoch": 0.44, "learning_rate": 3.116189964124584e-06, "loss": 1.2463, "step": 14543 }, { "epoch": 0.44, "learning_rate": 3.115953566345818e-06, "loss": 1.1367, "step": 14544 }, { "epoch": 0.44, "learning_rate": 3.115717162703471e-06, "loss": 1.1373, "step": 14545 }, { "epoch": 0.44, "learning_rate": 3.115480753199793e-06, "loss": 1.1202, "step": 14546 }, { "epoch": 0.44, "learning_rate": 3.115244337837035e-06, "loss": 1.1669, "step": 14547 }, { "epoch": 0.44, "learning_rate": 3.1150079166174474e-06, "loss": 1.1147, "step": 14548 }, { "epoch": 0.44, "learning_rate": 3.11477148954328e-06, "loss": 1.2626, "step": 14549 }, { "epoch": 0.44, "learning_rate": 3.114535056616784e-06, "loss": 1.1511, "step": 14550 }, { "epoch": 0.44, "learning_rate": 3.114298617840211e-06, "loss": 1.1161, "step": 14551 }, { "epoch": 0.44, "learning_rate": 3.1140621732158103e-06, "loss": 1.1277, "step": 14552 }, { "epoch": 0.44, "learning_rate": 3.113825722745834e-06, "loss": 1.0533, "step": 14553 }, { "epoch": 0.44, "learning_rate": 3.1135892664325322e-06, "loss": 1.0243, "step": 14554 }, { "epoch": 0.44, "learning_rate": 3.1133528042781563e-06, "loss": 1.0983, "step": 14555 }, { "epoch": 0.44, "learning_rate": 3.1131163362849566e-06, "loss": 1.2218, "step": 14556 }, { "epoch": 0.44, "learning_rate": 3.112879862455185e-06, "loss": 1.0516, "step": 14557 }, { "epoch": 0.44, "learning_rate": 3.1126433827910924e-06, "loss": 1.217, "step": 14558 }, { "epoch": 0.44, "learning_rate": 3.1124068972949296e-06, "loss": 1.0938, "step": 14559 }, { "epoch": 0.44, "learning_rate": 3.1121704059689482e-06, "loss": 1.1837, "step": 14560 }, { "epoch": 0.44, "learning_rate": 3.1119339088153992e-06, "loss": 1.1603, "step": 14561 }, { "epoch": 0.44, "learning_rate": 3.1116974058365344e-06, "loss": 1.2167, "step": 14562 }, { "epoch": 0.44, "learning_rate": 3.111460897034605e-06, "loss": 1.0822, "step": 14563 }, { "epoch": 0.44, "learning_rate": 3.1112243824118614e-06, "loss": 1.1799, "step": 14564 }, { "epoch": 0.44, "learning_rate": 3.1109878619705573e-06, "loss": 1.0494, "step": 14565 }, { "epoch": 0.44, "learning_rate": 3.1107513357129427e-06, "loss": 1.1968, "step": 14566 }, { "epoch": 0.44, "learning_rate": 3.1105148036412693e-06, "loss": 1.1229, "step": 14567 }, { "epoch": 0.44, "learning_rate": 3.110278265757789e-06, "loss": 1.2633, "step": 14568 }, { "epoch": 0.44, "learning_rate": 3.1100417220647538e-06, "loss": 1.1929, "step": 14569 }, { "epoch": 0.44, "learning_rate": 3.1098051725644145e-06, "loss": 1.1324, "step": 14570 }, { "epoch": 0.44, "learning_rate": 3.1095686172590238e-06, "loss": 1.0799, "step": 14571 }, { "epoch": 0.44, "learning_rate": 3.109332056150834e-06, "loss": 1.2193, "step": 14572 }, { "epoch": 0.44, "learning_rate": 3.1090954892420965e-06, "loss": 1.1339, "step": 14573 }, { "epoch": 0.44, "learning_rate": 3.108858916535063e-06, "loss": 1.0118, "step": 14574 }, { "epoch": 0.44, "learning_rate": 3.1086223380319858e-06, "loss": 1.1125, "step": 14575 }, { "epoch": 0.44, "learning_rate": 3.108385753735117e-06, "loss": 1.0933, "step": 14576 }, { "epoch": 0.44, "learning_rate": 3.1081491636467093e-06, "loss": 1.1613, "step": 14577 }, { "epoch": 0.44, "learning_rate": 3.1079125677690143e-06, "loss": 1.0859, "step": 14578 }, { "epoch": 0.44, "learning_rate": 3.107675966104284e-06, "loss": 1.1061, "step": 14579 }, { "epoch": 0.44, "learning_rate": 3.107439358654772e-06, "loss": 1.1367, "step": 14580 }, { "epoch": 0.44, "learning_rate": 3.107202745422729e-06, "loss": 1.153, "step": 14581 }, { "epoch": 0.44, "learning_rate": 3.106966126410409e-06, "loss": 0.9921, "step": 14582 }, { "epoch": 0.44, "learning_rate": 3.106729501620063e-06, "loss": 1.2466, "step": 14583 }, { "epoch": 0.44, "learning_rate": 3.1064928710539445e-06, "loss": 1.1276, "step": 14584 }, { "epoch": 0.44, "learning_rate": 3.106256234714306e-06, "loss": 1.1469, "step": 14585 }, { "epoch": 0.44, "learning_rate": 3.1060195926034008e-06, "loss": 1.2028, "step": 14586 }, { "epoch": 0.44, "learning_rate": 3.10578294472348e-06, "loss": 1.0746, "step": 14587 }, { "epoch": 0.44, "learning_rate": 3.1055462910767984e-06, "loss": 1.1592, "step": 14588 }, { "epoch": 0.44, "learning_rate": 3.1053096316656066e-06, "loss": 1.1341, "step": 14589 }, { "epoch": 0.44, "learning_rate": 3.1050729664921597e-06, "loss": 1.1014, "step": 14590 }, { "epoch": 0.44, "learning_rate": 3.1048362955587092e-06, "loss": 1.0673, "step": 14591 }, { "epoch": 0.44, "learning_rate": 3.1045996188675083e-06, "loss": 1.1321, "step": 14592 }, { "epoch": 0.44, "learning_rate": 3.1043629364208107e-06, "loss": 1.2352, "step": 14593 }, { "epoch": 0.44, "learning_rate": 3.1041262482208676e-06, "loss": 1.1136, "step": 14594 }, { "epoch": 0.44, "learning_rate": 3.1038895542699355e-06, "loss": 1.1023, "step": 14595 }, { "epoch": 0.44, "learning_rate": 3.1036528545702644e-06, "loss": 1.0204, "step": 14596 }, { "epoch": 0.44, "learning_rate": 3.103416149124109e-06, "loss": 1.1186, "step": 14597 }, { "epoch": 0.44, "learning_rate": 3.103179437933722e-06, "loss": 1.1667, "step": 14598 }, { "epoch": 0.44, "learning_rate": 3.1029427210013585e-06, "loss": 1.1467, "step": 14599 }, { "epoch": 0.44, "learning_rate": 3.10270599832927e-06, "loss": 1.1736, "step": 14600 }, { "epoch": 0.44, "learning_rate": 3.102469269919711e-06, "loss": 1.121, "step": 14601 }, { "epoch": 0.44, "learning_rate": 3.1022325357749344e-06, "loss": 1.0945, "step": 14602 }, { "epoch": 0.44, "learning_rate": 3.101995795897195e-06, "loss": 1.0612, "step": 14603 }, { "epoch": 0.44, "learning_rate": 3.1017590502887442e-06, "loss": 1.1653, "step": 14604 }, { "epoch": 0.44, "learning_rate": 3.1015222989518373e-06, "loss": 1.2545, "step": 14605 }, { "epoch": 0.44, "learning_rate": 3.1012855418887284e-06, "loss": 1.1232, "step": 14606 }, { "epoch": 0.44, "learning_rate": 3.1010487791016703e-06, "loss": 1.1832, "step": 14607 }, { "epoch": 0.44, "learning_rate": 3.1008120105929173e-06, "loss": 1.0968, "step": 14608 }, { "epoch": 0.44, "learning_rate": 3.1005752363647235e-06, "loss": 1.1289, "step": 14609 }, { "epoch": 0.44, "learning_rate": 3.1003384564193427e-06, "loss": 1.1951, "step": 14610 }, { "epoch": 0.44, "learning_rate": 3.1001016707590293e-06, "loss": 1.2086, "step": 14611 }, { "epoch": 0.44, "learning_rate": 3.099864879386036e-06, "loss": 1.0373, "step": 14612 }, { "epoch": 0.44, "learning_rate": 3.099628082302618e-06, "loss": 1.1238, "step": 14613 }, { "epoch": 0.44, "learning_rate": 3.099391279511031e-06, "loss": 1.0614, "step": 14614 }, { "epoch": 0.44, "learning_rate": 3.0991544710135263e-06, "loss": 1.1411, "step": 14615 }, { "epoch": 0.44, "learning_rate": 3.0989176568123603e-06, "loss": 1.007, "step": 14616 }, { "epoch": 0.44, "learning_rate": 3.098680836909786e-06, "loss": 1.1929, "step": 14617 }, { "epoch": 0.44, "learning_rate": 3.0984440113080586e-06, "loss": 1.1612, "step": 14618 }, { "epoch": 0.44, "learning_rate": 3.098207180009433e-06, "loss": 1.1599, "step": 14619 }, { "epoch": 0.44, "learning_rate": 3.097970343016163e-06, "loss": 1.0674, "step": 14620 }, { "epoch": 0.44, "learning_rate": 3.0977335003305033e-06, "loss": 1.0992, "step": 14621 }, { "epoch": 0.44, "learning_rate": 3.097496651954708e-06, "loss": 1.1409, "step": 14622 }, { "epoch": 0.44, "learning_rate": 3.097259797891033e-06, "loss": 1.1318, "step": 14623 }, { "epoch": 0.44, "learning_rate": 3.097022938141732e-06, "loss": 1.2057, "step": 14624 }, { "epoch": 0.44, "learning_rate": 3.0967860727090598e-06, "loss": 1.2011, "step": 14625 }, { "epoch": 0.44, "learning_rate": 3.096549201595272e-06, "loss": 1.0654, "step": 14626 }, { "epoch": 0.44, "learning_rate": 3.096312324802624e-06, "loss": 1.0894, "step": 14627 }, { "epoch": 0.44, "learning_rate": 3.0960754423333684e-06, "loss": 1.0469, "step": 14628 }, { "epoch": 0.44, "learning_rate": 3.095838554189763e-06, "loss": 1.1129, "step": 14629 }, { "epoch": 0.44, "learning_rate": 3.09560166037406e-06, "loss": 1.2709, "step": 14630 }, { "epoch": 0.44, "learning_rate": 3.0953647608885173e-06, "loss": 1.1896, "step": 14631 }, { "epoch": 0.44, "learning_rate": 3.0951278557353887e-06, "loss": 1.0833, "step": 14632 }, { "epoch": 0.44, "learning_rate": 3.094890944916929e-06, "loss": 1.1313, "step": 14633 }, { "epoch": 0.44, "learning_rate": 3.0946540284353943e-06, "loss": 0.9858, "step": 14634 }, { "epoch": 0.44, "learning_rate": 3.0944171062930395e-06, "loss": 1.2241, "step": 14635 }, { "epoch": 0.44, "learning_rate": 3.0941801784921205e-06, "loss": 1.265, "step": 14636 }, { "epoch": 0.44, "learning_rate": 3.0939432450348916e-06, "loss": 1.1143, "step": 14637 }, { "epoch": 0.44, "learning_rate": 3.0937063059236094e-06, "loss": 1.1542, "step": 14638 }, { "epoch": 0.44, "learning_rate": 3.0934693611605295e-06, "loss": 1.1279, "step": 14639 }, { "epoch": 0.44, "learning_rate": 3.093232410747907e-06, "loss": 0.989, "step": 14640 }, { "epoch": 0.44, "learning_rate": 3.0929954546879975e-06, "loss": 1.0112, "step": 14641 }, { "epoch": 0.44, "learning_rate": 3.092758492983057e-06, "loss": 1.1883, "step": 14642 }, { "epoch": 0.44, "learning_rate": 3.092521525635341e-06, "loss": 1.1767, "step": 14643 }, { "epoch": 0.44, "learning_rate": 3.092284552647105e-06, "loss": 1.098, "step": 14644 }, { "epoch": 0.44, "learning_rate": 3.0920475740206064e-06, "loss": 1.1931, "step": 14645 }, { "epoch": 0.44, "learning_rate": 3.091810589758099e-06, "loss": 1.0893, "step": 14646 }, { "epoch": 0.44, "learning_rate": 3.0915735998618406e-06, "loss": 1.1791, "step": 14647 }, { "epoch": 0.44, "learning_rate": 3.091336604334086e-06, "loss": 1.0649, "step": 14648 }, { "epoch": 0.44, "learning_rate": 3.0910996031770916e-06, "loss": 1.1564, "step": 14649 }, { "epoch": 0.44, "learning_rate": 3.0908625963931137e-06, "loss": 1.1019, "step": 14650 }, { "epoch": 0.44, "learning_rate": 3.0906255839844093e-06, "loss": 1.1213, "step": 14651 }, { "epoch": 0.44, "learning_rate": 3.0903885659532327e-06, "loss": 1.064, "step": 14652 }, { "epoch": 0.44, "learning_rate": 3.0901515423018417e-06, "loss": 1.0818, "step": 14653 }, { "epoch": 0.44, "learning_rate": 3.089914513032492e-06, "loss": 1.2269, "step": 14654 }, { "epoch": 0.44, "learning_rate": 3.089677478147441e-06, "loss": 1.1635, "step": 14655 }, { "epoch": 0.44, "learning_rate": 3.0894404376489433e-06, "loss": 1.135, "step": 14656 }, { "epoch": 0.44, "learning_rate": 3.0892033915392573e-06, "loss": 1.1979, "step": 14657 }, { "epoch": 0.44, "learning_rate": 3.088966339820639e-06, "loss": 1.0381, "step": 14658 }, { "epoch": 0.44, "learning_rate": 3.088729282495344e-06, "loss": 1.182, "step": 14659 }, { "epoch": 0.44, "learning_rate": 3.0884922195656304e-06, "loss": 1.1091, "step": 14660 }, { "epoch": 0.44, "learning_rate": 3.088255151033754e-06, "loss": 1.0689, "step": 14661 }, { "epoch": 0.44, "learning_rate": 3.0880180769019718e-06, "loss": 1.1868, "step": 14662 }, { "epoch": 0.44, "learning_rate": 3.087780997172541e-06, "loss": 1.106, "step": 14663 }, { "epoch": 0.44, "learning_rate": 3.0875439118477184e-06, "loss": 1.1465, "step": 14664 }, { "epoch": 0.44, "learning_rate": 3.0873068209297604e-06, "loss": 1.1614, "step": 14665 }, { "epoch": 0.44, "learning_rate": 3.0870697244209236e-06, "loss": 1.1969, "step": 14666 }, { "epoch": 0.44, "learning_rate": 3.0868326223234664e-06, "loss": 1.127, "step": 14667 }, { "epoch": 0.44, "learning_rate": 3.086595514639646e-06, "loss": 1.2479, "step": 14668 }, { "epoch": 0.44, "learning_rate": 3.0863584013717174e-06, "loss": 1.1121, "step": 14669 }, { "epoch": 0.44, "learning_rate": 3.0861212825219407e-06, "loss": 1.2092, "step": 14670 }, { "epoch": 0.44, "learning_rate": 3.0858841580925704e-06, "loss": 1.1615, "step": 14671 }, { "epoch": 0.44, "learning_rate": 3.085647028085865e-06, "loss": 1.1111, "step": 14672 }, { "epoch": 0.44, "learning_rate": 3.0854098925040833e-06, "loss": 1.1444, "step": 14673 }, { "epoch": 0.44, "learning_rate": 3.0851727513494808e-06, "loss": 1.2431, "step": 14674 }, { "epoch": 0.44, "learning_rate": 3.0849356046243157e-06, "loss": 1.1693, "step": 14675 }, { "epoch": 0.44, "learning_rate": 3.0846984523308445e-06, "loss": 1.1588, "step": 14676 }, { "epoch": 0.44, "learning_rate": 3.0844612944713267e-06, "loss": 1.1873, "step": 14677 }, { "epoch": 0.44, "learning_rate": 3.084224131048018e-06, "loss": 1.113, "step": 14678 }, { "epoch": 0.44, "learning_rate": 3.0839869620631768e-06, "loss": 1.1453, "step": 14679 }, { "epoch": 0.44, "learning_rate": 3.0837497875190615e-06, "loss": 1.1719, "step": 14680 }, { "epoch": 0.44, "learning_rate": 3.0835126074179293e-06, "loss": 1.1417, "step": 14681 }, { "epoch": 0.44, "learning_rate": 3.083275421762038e-06, "loss": 1.0988, "step": 14682 }, { "epoch": 0.44, "learning_rate": 3.083038230553646e-06, "loss": 1.1409, "step": 14683 }, { "epoch": 0.44, "learning_rate": 3.0828010337950105e-06, "loss": 1.115, "step": 14684 }, { "epoch": 0.44, "learning_rate": 3.08256383148839e-06, "loss": 1.1482, "step": 14685 }, { "epoch": 0.44, "learning_rate": 3.0823266236360428e-06, "loss": 1.1849, "step": 14686 }, { "epoch": 0.44, "learning_rate": 3.0820894102402253e-06, "loss": 1.2848, "step": 14687 }, { "epoch": 0.44, "learning_rate": 3.0818521913031984e-06, "loss": 1.0839, "step": 14688 }, { "epoch": 0.44, "learning_rate": 3.0816149668272176e-06, "loss": 1.0945, "step": 14689 }, { "epoch": 0.44, "learning_rate": 3.0813777368145437e-06, "loss": 1.1216, "step": 14690 }, { "epoch": 0.44, "learning_rate": 3.0811405012674327e-06, "loss": 1.1013, "step": 14691 }, { "epoch": 0.44, "learning_rate": 3.0809032601881446e-06, "loss": 1.1941, "step": 14692 }, { "epoch": 0.44, "learning_rate": 3.0806660135789375e-06, "loss": 1.0532, "step": 14693 }, { "epoch": 0.44, "learning_rate": 3.0804287614420684e-06, "loss": 1.1483, "step": 14694 }, { "epoch": 0.44, "learning_rate": 3.080191503779798e-06, "loss": 1.1666, "step": 14695 }, { "epoch": 0.44, "learning_rate": 3.079954240594384e-06, "loss": 1.1475, "step": 14696 }, { "epoch": 0.44, "learning_rate": 3.079716971888084e-06, "loss": 1.1516, "step": 14697 }, { "epoch": 0.44, "learning_rate": 3.0794796976631585e-06, "loss": 1.1373, "step": 14698 }, { "epoch": 0.44, "learning_rate": 3.0792424179218655e-06, "loss": 1.178, "step": 14699 }, { "epoch": 0.44, "learning_rate": 3.0790051326664634e-06, "loss": 1.2847, "step": 14700 }, { "epoch": 0.44, "learning_rate": 3.0787678418992112e-06, "loss": 1.0834, "step": 14701 }, { "epoch": 0.44, "learning_rate": 3.078530545622368e-06, "loss": 1.1385, "step": 14702 }, { "epoch": 0.44, "learning_rate": 3.078293243838193e-06, "loss": 1.176, "step": 14703 }, { "epoch": 0.44, "learning_rate": 3.078055936548944e-06, "loss": 1.0701, "step": 14704 }, { "epoch": 0.44, "learning_rate": 3.0778186237568814e-06, "loss": 1.0605, "step": 14705 }, { "epoch": 0.44, "learning_rate": 3.0775813054642632e-06, "loss": 1.2028, "step": 14706 }, { "epoch": 0.44, "learning_rate": 3.0773439816733496e-06, "loss": 1.1182, "step": 14707 }, { "epoch": 0.44, "learning_rate": 3.077106652386399e-06, "loss": 1.0781, "step": 14708 }, { "epoch": 0.44, "learning_rate": 3.076869317605672e-06, "loss": 1.1337, "step": 14709 }, { "epoch": 0.44, "learning_rate": 3.076631977333426e-06, "loss": 1.1226, "step": 14710 }, { "epoch": 0.44, "learning_rate": 3.0763946315719213e-06, "loss": 1.0858, "step": 14711 }, { "epoch": 0.44, "learning_rate": 3.076157280323418e-06, "loss": 1.1463, "step": 14712 }, { "epoch": 0.44, "learning_rate": 3.0759199235901745e-06, "loss": 1.1273, "step": 14713 }, { "epoch": 0.44, "learning_rate": 3.0756825613744506e-06, "loss": 1.0483, "step": 14714 }, { "epoch": 0.44, "learning_rate": 3.0754451936785057e-06, "loss": 1.1028, "step": 14715 }, { "epoch": 0.44, "learning_rate": 3.0752078205046006e-06, "loss": 1.1893, "step": 14716 }, { "epoch": 0.44, "learning_rate": 3.074970441854993e-06, "loss": 1.2094, "step": 14717 }, { "epoch": 0.44, "learning_rate": 3.0747330577319444e-06, "loss": 1.1157, "step": 14718 }, { "epoch": 0.44, "learning_rate": 3.0744956681377135e-06, "loss": 1.2896, "step": 14719 }, { "epoch": 0.44, "learning_rate": 3.0742582730745606e-06, "loss": 1.1337, "step": 14720 }, { "epoch": 0.44, "learning_rate": 3.0740208725447456e-06, "loss": 1.1336, "step": 14721 }, { "epoch": 0.44, "learning_rate": 3.073783466550529e-06, "loss": 1.115, "step": 14722 }, { "epoch": 0.44, "learning_rate": 3.073546055094169e-06, "loss": 1.1548, "step": 14723 }, { "epoch": 0.44, "learning_rate": 3.0733086381779274e-06, "loss": 1.2521, "step": 14724 }, { "epoch": 0.44, "learning_rate": 3.073071215804064e-06, "loss": 1.111, "step": 14725 }, { "epoch": 0.44, "learning_rate": 3.072833787974838e-06, "loss": 1.15, "step": 14726 }, { "epoch": 0.44, "learning_rate": 3.072596354692511e-06, "loss": 1.0164, "step": 14727 }, { "epoch": 0.44, "learning_rate": 3.0723589159593416e-06, "loss": 1.0891, "step": 14728 }, { "epoch": 0.44, "learning_rate": 3.0721214717775918e-06, "loss": 1.0938, "step": 14729 }, { "epoch": 0.44, "learning_rate": 3.07188402214952e-06, "loss": 1.1459, "step": 14730 }, { "epoch": 0.44, "learning_rate": 3.0716465670773887e-06, "loss": 1.1202, "step": 14731 }, { "epoch": 0.44, "learning_rate": 3.071409106563457e-06, "loss": 1.0472, "step": 14732 }, { "epoch": 0.44, "learning_rate": 3.0711716406099857e-06, "loss": 1.1375, "step": 14733 }, { "epoch": 0.44, "learning_rate": 3.0709341692192357e-06, "loss": 1.0275, "step": 14734 }, { "epoch": 0.44, "learning_rate": 3.070696692393467e-06, "loss": 1.2274, "step": 14735 }, { "epoch": 0.44, "learning_rate": 3.0704592101349414e-06, "loss": 1.0761, "step": 14736 }, { "epoch": 0.44, "learning_rate": 3.070221722445918e-06, "loss": 1.2225, "step": 14737 }, { "epoch": 0.44, "learning_rate": 3.069984229328659e-06, "loss": 1.1825, "step": 14738 }, { "epoch": 0.44, "learning_rate": 3.0697467307854243e-06, "loss": 1.0791, "step": 14739 }, { "epoch": 0.44, "learning_rate": 3.0695092268184755e-06, "loss": 1.1956, "step": 14740 }, { "epoch": 0.44, "learning_rate": 3.0692717174300727e-06, "loss": 1.1542, "step": 14741 }, { "epoch": 0.44, "learning_rate": 3.0690342026224785e-06, "loss": 1.0583, "step": 14742 }, { "epoch": 0.44, "learning_rate": 3.0687966823979515e-06, "loss": 1.2639, "step": 14743 }, { "epoch": 0.44, "learning_rate": 3.0685591567587545e-06, "loss": 1.1705, "step": 14744 }, { "epoch": 0.44, "learning_rate": 3.068321625707148e-06, "loss": 1.0775, "step": 14745 }, { "epoch": 0.44, "learning_rate": 3.068084089245394e-06, "loss": 1.0995, "step": 14746 }, { "epoch": 0.44, "learning_rate": 3.067846547375752e-06, "loss": 1.0996, "step": 14747 }, { "epoch": 0.44, "learning_rate": 3.0676090001004845e-06, "loss": 1.1075, "step": 14748 }, { "epoch": 0.44, "learning_rate": 3.067371447421853e-06, "loss": 1.2621, "step": 14749 }, { "epoch": 0.44, "learning_rate": 3.0671338893421186e-06, "loss": 1.1689, "step": 14750 }, { "epoch": 0.44, "learning_rate": 3.0668963258635424e-06, "loss": 1.127, "step": 14751 }, { "epoch": 0.44, "learning_rate": 3.0666587569883868e-06, "loss": 1.1248, "step": 14752 }, { "epoch": 0.44, "learning_rate": 3.0664211827189124e-06, "loss": 1.0974, "step": 14753 }, { "epoch": 0.44, "learning_rate": 3.066183603057381e-06, "loss": 1.2842, "step": 14754 }, { "epoch": 0.44, "learning_rate": 3.0659460180060546e-06, "loss": 1.1293, "step": 14755 }, { "epoch": 0.44, "learning_rate": 3.0657084275671943e-06, "loss": 1.1981, "step": 14756 }, { "epoch": 0.44, "learning_rate": 3.0654708317430633e-06, "loss": 1.1049, "step": 14757 }, { "epoch": 0.44, "learning_rate": 3.065233230535921e-06, "loss": 1.1393, "step": 14758 }, { "epoch": 0.44, "learning_rate": 3.0649956239480317e-06, "loss": 1.1057, "step": 14759 }, { "epoch": 0.44, "learning_rate": 3.0647580119816554e-06, "loss": 1.2109, "step": 14760 }, { "epoch": 0.44, "learning_rate": 3.064520394639055e-06, "loss": 1.0641, "step": 14761 }, { "epoch": 0.44, "learning_rate": 3.064282771922492e-06, "loss": 1.2008, "step": 14762 }, { "epoch": 0.44, "learning_rate": 3.0640451438342294e-06, "loss": 1.1712, "step": 14763 }, { "epoch": 0.44, "learning_rate": 3.0638075103765287e-06, "loss": 1.1107, "step": 14764 }, { "epoch": 0.44, "learning_rate": 3.063569871551651e-06, "loss": 1.1293, "step": 14765 }, { "epoch": 0.44, "learning_rate": 3.063332227361861e-06, "loss": 1.0225, "step": 14766 }, { "epoch": 0.44, "learning_rate": 3.0630945778094184e-06, "loss": 1.2394, "step": 14767 }, { "epoch": 0.44, "learning_rate": 3.062856922896587e-06, "loss": 1.189, "step": 14768 }, { "epoch": 0.44, "learning_rate": 3.062619262625629e-06, "loss": 1.1292, "step": 14769 }, { "epoch": 0.44, "learning_rate": 3.0623815969988067e-06, "loss": 1.0402, "step": 14770 }, { "epoch": 0.44, "learning_rate": 3.0621439260183816e-06, "loss": 1.069, "step": 14771 }, { "epoch": 0.45, "learning_rate": 3.061906249686618e-06, "loss": 1.1075, "step": 14772 }, { "epoch": 0.45, "learning_rate": 3.0616685680057774e-06, "loss": 1.165, "step": 14773 }, { "epoch": 0.45, "learning_rate": 3.0614308809781217e-06, "loss": 1.2053, "step": 14774 }, { "epoch": 0.45, "learning_rate": 3.0611931886059156e-06, "loss": 1.1024, "step": 14775 }, { "epoch": 0.45, "learning_rate": 3.0609554908914197e-06, "loss": 1.1535, "step": 14776 }, { "epoch": 0.45, "learning_rate": 3.060717787836898e-06, "loss": 1.0752, "step": 14777 }, { "epoch": 0.45, "learning_rate": 3.0604800794446127e-06, "loss": 1.1179, "step": 14778 }, { "epoch": 0.45, "learning_rate": 3.0602423657168272e-06, "loss": 1.1052, "step": 14779 }, { "epoch": 0.45, "learning_rate": 3.0600046466558043e-06, "loss": 1.1312, "step": 14780 }, { "epoch": 0.45, "learning_rate": 3.059766922263807e-06, "loss": 1.0672, "step": 14781 }, { "epoch": 0.45, "learning_rate": 3.059529192543098e-06, "loss": 1.1547, "step": 14782 }, { "epoch": 0.45, "learning_rate": 3.059291457495941e-06, "loss": 1.1434, "step": 14783 }, { "epoch": 0.45, "learning_rate": 3.0590537171245983e-06, "loss": 1.1545, "step": 14784 }, { "epoch": 0.45, "learning_rate": 3.0588159714313336e-06, "loss": 1.1465, "step": 14785 }, { "epoch": 0.45, "learning_rate": 3.0585782204184093e-06, "loss": 1.2677, "step": 14786 }, { "epoch": 0.45, "learning_rate": 3.0583404640880904e-06, "loss": 1.1063, "step": 14787 }, { "epoch": 0.45, "learning_rate": 3.0581027024426385e-06, "loss": 1.044, "step": 14788 }, { "epoch": 0.45, "learning_rate": 3.0578649354843177e-06, "loss": 1.1429, "step": 14789 }, { "epoch": 0.45, "learning_rate": 3.0576271632153913e-06, "loss": 1.1365, "step": 14790 }, { "epoch": 0.45, "learning_rate": 3.0573893856381234e-06, "loss": 1.0804, "step": 14791 }, { "epoch": 0.45, "learning_rate": 3.0571516027547764e-06, "loss": 1.1697, "step": 14792 }, { "epoch": 0.45, "learning_rate": 3.056913814567615e-06, "loss": 1.2116, "step": 14793 }, { "epoch": 0.45, "learning_rate": 3.0566760210789024e-06, "loss": 1.1603, "step": 14794 }, { "epoch": 0.45, "learning_rate": 3.0564382222909016e-06, "loss": 1.1406, "step": 14795 }, { "epoch": 0.45, "learning_rate": 3.0562004182058774e-06, "loss": 1.0244, "step": 14796 }, { "epoch": 0.45, "learning_rate": 3.055962608826093e-06, "loss": 1.0757, "step": 14797 }, { "epoch": 0.45, "learning_rate": 3.0557247941538125e-06, "loss": 1.1399, "step": 14798 }, { "epoch": 0.45, "learning_rate": 3.055486974191299e-06, "loss": 1.0634, "step": 14799 }, { "epoch": 0.45, "learning_rate": 3.0552491489408177e-06, "loss": 0.9146, "step": 14800 }, { "epoch": 0.45, "learning_rate": 3.0550113184046316e-06, "loss": 1.1141, "step": 14801 }, { "epoch": 0.45, "learning_rate": 3.0547734825850047e-06, "loss": 1.0416, "step": 14802 }, { "epoch": 0.45, "learning_rate": 3.0545356414842015e-06, "loss": 1.1083, "step": 14803 }, { "epoch": 0.45, "learning_rate": 3.054297795104486e-06, "loss": 1.2559, "step": 14804 }, { "epoch": 0.45, "learning_rate": 3.0540599434481234e-06, "loss": 1.1813, "step": 14805 }, { "epoch": 0.45, "learning_rate": 3.0538220865173764e-06, "loss": 1.1415, "step": 14806 }, { "epoch": 0.45, "learning_rate": 3.05358422431451e-06, "loss": 1.0627, "step": 14807 }, { "epoch": 0.45, "learning_rate": 3.0533463568417878e-06, "loss": 1.1559, "step": 14808 }, { "epoch": 0.45, "learning_rate": 3.0531084841014757e-06, "loss": 1.0953, "step": 14809 }, { "epoch": 0.45, "learning_rate": 3.052870606095836e-06, "loss": 1.1125, "step": 14810 }, { "epoch": 0.45, "learning_rate": 3.052632722827136e-06, "loss": 1.0751, "step": 14811 }, { "epoch": 0.45, "learning_rate": 3.052394834297637e-06, "loss": 1.1754, "step": 14812 }, { "epoch": 0.45, "learning_rate": 3.052156940509607e-06, "loss": 1.0242, "step": 14813 }, { "epoch": 0.45, "learning_rate": 3.0519190414653073e-06, "loss": 1.1301, "step": 14814 }, { "epoch": 0.45, "learning_rate": 3.051681137167005e-06, "loss": 0.9966, "step": 14815 }, { "epoch": 0.45, "learning_rate": 3.0514432276169635e-06, "loss": 1.1392, "step": 14816 }, { "epoch": 0.45, "learning_rate": 3.051205312817448e-06, "loss": 1.1576, "step": 14817 }, { "epoch": 0.45, "learning_rate": 3.0509673927707233e-06, "loss": 1.0967, "step": 14818 }, { "epoch": 0.45, "learning_rate": 3.0507294674790544e-06, "loss": 1.1479, "step": 14819 }, { "epoch": 0.45, "learning_rate": 3.050491536944707e-06, "loss": 1.0662, "step": 14820 }, { "epoch": 0.45, "learning_rate": 3.0502536011699444e-06, "loss": 1.1151, "step": 14821 }, { "epoch": 0.45, "learning_rate": 3.0500156601570336e-06, "loss": 1.1435, "step": 14822 }, { "epoch": 0.45, "learning_rate": 3.0497777139082374e-06, "loss": 1.1257, "step": 14823 }, { "epoch": 0.45, "learning_rate": 3.049539762425823e-06, "loss": 1.0964, "step": 14824 }, { "epoch": 0.45, "learning_rate": 3.0493018057120543e-06, "loss": 1.2317, "step": 14825 }, { "epoch": 0.45, "learning_rate": 3.0490638437691974e-06, "loss": 1.2184, "step": 14826 }, { "epoch": 0.45, "learning_rate": 3.0488258765995166e-06, "loss": 1.0772, "step": 14827 }, { "epoch": 0.45, "learning_rate": 3.0485879042052785e-06, "loss": 1.0153, "step": 14828 }, { "epoch": 0.45, "learning_rate": 3.048349926588747e-06, "loss": 1.2186, "step": 14829 }, { "epoch": 0.45, "learning_rate": 3.0481119437521884e-06, "loss": 1.2355, "step": 14830 }, { "epoch": 0.45, "learning_rate": 3.0478739556978676e-06, "loss": 0.9916, "step": 14831 }, { "epoch": 0.45, "learning_rate": 3.047635962428051e-06, "loss": 1.067, "step": 14832 }, { "epoch": 0.45, "learning_rate": 3.0473979639450048e-06, "loss": 1.0667, "step": 14833 }, { "epoch": 0.45, "learning_rate": 3.047159960250992e-06, "loss": 1.0767, "step": 14834 }, { "epoch": 0.45, "learning_rate": 3.046921951348281e-06, "loss": 1.0927, "step": 14835 }, { "epoch": 0.45, "learning_rate": 3.0466839372391365e-06, "loss": 1.106, "step": 14836 }, { "epoch": 0.45, "learning_rate": 3.046445917925824e-06, "loss": 1.1881, "step": 14837 }, { "epoch": 0.45, "learning_rate": 3.0462078934106093e-06, "loss": 1.1042, "step": 14838 }, { "epoch": 0.45, "learning_rate": 3.045969863695759e-06, "loss": 1.1733, "step": 14839 }, { "epoch": 0.45, "learning_rate": 3.045731828783538e-06, "loss": 1.2003, "step": 14840 }, { "epoch": 0.45, "learning_rate": 3.0454937886762133e-06, "loss": 1.1149, "step": 14841 }, { "epoch": 0.45, "learning_rate": 3.04525574337605e-06, "loss": 1.1506, "step": 14842 }, { "epoch": 0.45, "learning_rate": 3.045017692885314e-06, "loss": 1.0517, "step": 14843 }, { "epoch": 0.45, "learning_rate": 3.044779637206273e-06, "loss": 1.0084, "step": 14844 }, { "epoch": 0.45, "learning_rate": 3.044541576341192e-06, "loss": 1.1625, "step": 14845 }, { "epoch": 0.45, "learning_rate": 3.044303510292338e-06, "loss": 1.0669, "step": 14846 }, { "epoch": 0.45, "learning_rate": 3.0440654390619756e-06, "loss": 1.1125, "step": 14847 }, { "epoch": 0.45, "learning_rate": 3.0438273626523733e-06, "loss": 1.1068, "step": 14848 }, { "epoch": 0.45, "learning_rate": 3.0435892810657958e-06, "loss": 1.0877, "step": 14849 }, { "epoch": 0.45, "learning_rate": 3.0433511943045106e-06, "loss": 1.27, "step": 14850 }, { "epoch": 0.45, "learning_rate": 3.043113102370783e-06, "loss": 1.0872, "step": 14851 }, { "epoch": 0.45, "learning_rate": 3.0428750052668814e-06, "loss": 1.0952, "step": 14852 }, { "epoch": 0.45, "learning_rate": 3.0426369029950703e-06, "loss": 1.1595, "step": 14853 }, { "epoch": 0.45, "learning_rate": 3.0423987955576177e-06, "loss": 1.1741, "step": 14854 }, { "epoch": 0.45, "learning_rate": 3.0421606829567895e-06, "loss": 1.1337, "step": 14855 }, { "epoch": 0.45, "learning_rate": 3.0419225651948524e-06, "loss": 1.176, "step": 14856 }, { "epoch": 0.45, "learning_rate": 3.041684442274074e-06, "loss": 1.1602, "step": 14857 }, { "epoch": 0.45, "learning_rate": 3.0414463141967203e-06, "loss": 1.1531, "step": 14858 }, { "epoch": 0.45, "learning_rate": 3.0412081809650583e-06, "loss": 1.1306, "step": 14859 }, { "epoch": 0.45, "learning_rate": 3.0409700425813553e-06, "loss": 1.2427, "step": 14860 }, { "epoch": 0.45, "learning_rate": 3.0407318990478783e-06, "loss": 1.2053, "step": 14861 }, { "epoch": 0.45, "learning_rate": 3.040493750366894e-06, "loss": 1.3325, "step": 14862 }, { "epoch": 0.45, "learning_rate": 3.0402555965406694e-06, "loss": 1.1187, "step": 14863 }, { "epoch": 0.45, "learning_rate": 3.0400174375714713e-06, "loss": 1.0901, "step": 14864 }, { "epoch": 0.45, "learning_rate": 3.0397792734615684e-06, "loss": 1.1011, "step": 14865 }, { "epoch": 0.45, "learning_rate": 3.0395411042132256e-06, "loss": 1.1588, "step": 14866 }, { "epoch": 0.45, "learning_rate": 3.039302929828712e-06, "loss": 1.2394, "step": 14867 }, { "epoch": 0.45, "learning_rate": 3.0390647503102937e-06, "loss": 1.2151, "step": 14868 }, { "epoch": 0.45, "learning_rate": 3.0388265656602395e-06, "loss": 1.0953, "step": 14869 }, { "epoch": 0.45, "learning_rate": 3.038588375880815e-06, "loss": 1.1587, "step": 14870 }, { "epoch": 0.45, "learning_rate": 3.0383501809742888e-06, "loss": 1.1756, "step": 14871 }, { "epoch": 0.45, "learning_rate": 3.0381119809429277e-06, "loss": 1.0594, "step": 14872 }, { "epoch": 0.45, "learning_rate": 3.037873775789e-06, "loss": 1.041, "step": 14873 }, { "epoch": 0.45, "learning_rate": 3.0376355655147738e-06, "loss": 1.1254, "step": 14874 }, { "epoch": 0.45, "learning_rate": 3.037397350122515e-06, "loss": 1.0798, "step": 14875 }, { "epoch": 0.45, "learning_rate": 3.037159129614493e-06, "loss": 1.1326, "step": 14876 }, { "epoch": 0.45, "learning_rate": 3.0369209039929744e-06, "loss": 1.2007, "step": 14877 }, { "epoch": 0.45, "learning_rate": 3.036682673260228e-06, "loss": 1.1541, "step": 14878 }, { "epoch": 0.45, "learning_rate": 3.03644443741852e-06, "loss": 1.1207, "step": 14879 }, { "epoch": 0.45, "learning_rate": 3.03620619647012e-06, "loss": 1.1224, "step": 14880 }, { "epoch": 0.45, "learning_rate": 3.0359679504172944e-06, "loss": 1.2437, "step": 14881 }, { "epoch": 0.45, "learning_rate": 3.0357296992623132e-06, "loss": 1.199, "step": 14882 }, { "epoch": 0.45, "learning_rate": 3.0354914430074424e-06, "loss": 1.0492, "step": 14883 }, { "epoch": 0.45, "learning_rate": 3.035253181654951e-06, "loss": 1.0746, "step": 14884 }, { "epoch": 0.45, "learning_rate": 3.0350149152071073e-06, "loss": 1.0243, "step": 14885 }, { "epoch": 0.45, "learning_rate": 3.034776643666179e-06, "loss": 1.1371, "step": 14886 }, { "epoch": 0.45, "learning_rate": 3.034538367034435e-06, "loss": 1.2206, "step": 14887 }, { "epoch": 0.45, "learning_rate": 3.0343000853141434e-06, "loss": 1.1569, "step": 14888 }, { "epoch": 0.45, "learning_rate": 3.0340617985075726e-06, "loss": 1.1542, "step": 14889 }, { "epoch": 0.45, "learning_rate": 3.03382350661699e-06, "loss": 1.0891, "step": 14890 }, { "epoch": 0.45, "learning_rate": 3.033585209644665e-06, "loss": 1.1248, "step": 14891 }, { "epoch": 0.45, "learning_rate": 3.0333469075928657e-06, "loss": 1.0459, "step": 14892 }, { "epoch": 0.45, "learning_rate": 3.033108600463861e-06, "loss": 1.0521, "step": 14893 }, { "epoch": 0.45, "learning_rate": 3.032870288259918e-06, "loss": 1.0944, "step": 14894 }, { "epoch": 0.45, "learning_rate": 3.032631970983308e-06, "loss": 1.0605, "step": 14895 }, { "epoch": 0.45, "learning_rate": 3.0323936486362977e-06, "loss": 1.1127, "step": 14896 }, { "epoch": 0.45, "learning_rate": 3.0321553212211556e-06, "loss": 1.0903, "step": 14897 }, { "epoch": 0.45, "learning_rate": 3.0319169887401517e-06, "loss": 1.1921, "step": 14898 }, { "epoch": 0.45, "learning_rate": 3.0316786511955544e-06, "loss": 1.015, "step": 14899 }, { "epoch": 0.45, "learning_rate": 3.0314403085896315e-06, "loss": 1.1487, "step": 14900 }, { "epoch": 0.45, "learning_rate": 3.0312019609246536e-06, "loss": 1.0677, "step": 14901 }, { "epoch": 0.45, "learning_rate": 3.0309636082028885e-06, "loss": 1.0962, "step": 14902 }, { "epoch": 0.45, "learning_rate": 3.030725250426606e-06, "loss": 1.048, "step": 14903 }, { "epoch": 0.45, "learning_rate": 3.0304868875980747e-06, "loss": 1.1287, "step": 14904 }, { "epoch": 0.45, "learning_rate": 3.0302485197195635e-06, "loss": 1.2548, "step": 14905 }, { "epoch": 0.45, "learning_rate": 3.0300101467933425e-06, "loss": 1.1954, "step": 14906 }, { "epoch": 0.45, "learning_rate": 3.029771768821679e-06, "loss": 1.0962, "step": 14907 }, { "epoch": 0.45, "learning_rate": 3.0295333858068445e-06, "loss": 1.0999, "step": 14908 }, { "epoch": 0.45, "learning_rate": 3.029294997751106e-06, "loss": 1.0826, "step": 14909 }, { "epoch": 0.45, "learning_rate": 3.0290566046567344e-06, "loss": 1.1889, "step": 14910 }, { "epoch": 0.45, "learning_rate": 3.0288182065259997e-06, "loss": 1.2178, "step": 14911 }, { "epoch": 0.45, "learning_rate": 3.028579803361169e-06, "loss": 0.9716, "step": 14912 }, { "epoch": 0.45, "learning_rate": 3.0283413951645135e-06, "loss": 1.0901, "step": 14913 }, { "epoch": 0.45, "learning_rate": 3.028102981938303e-06, "loss": 1.0308, "step": 14914 }, { "epoch": 0.45, "learning_rate": 3.027864563684806e-06, "loss": 1.0925, "step": 14915 }, { "epoch": 0.45, "learning_rate": 3.0276261404062925e-06, "loss": 1.0338, "step": 14916 }, { "epoch": 0.45, "learning_rate": 3.027387712105033e-06, "loss": 1.1744, "step": 14917 }, { "epoch": 0.45, "learning_rate": 3.027149278783296e-06, "loss": 1.3307, "step": 14918 }, { "epoch": 0.45, "learning_rate": 3.0269108404433516e-06, "loss": 1.1037, "step": 14919 }, { "epoch": 0.45, "learning_rate": 3.0266723970874696e-06, "loss": 1.1788, "step": 14920 }, { "epoch": 0.45, "learning_rate": 3.026433948717921e-06, "loss": 1.0553, "step": 14921 }, { "epoch": 0.45, "learning_rate": 3.026195495336973e-06, "loss": 1.1447, "step": 14922 }, { "epoch": 0.45, "learning_rate": 3.025957036946899e-06, "loss": 1.1297, "step": 14923 }, { "epoch": 0.45, "learning_rate": 3.0257185735499667e-06, "loss": 1.0829, "step": 14924 }, { "epoch": 0.45, "learning_rate": 3.025480105148446e-06, "loss": 1.1163, "step": 14925 }, { "epoch": 0.45, "learning_rate": 3.0252416317446087e-06, "loss": 1.1706, "step": 14926 }, { "epoch": 0.45, "learning_rate": 3.025003153340724e-06, "loss": 1.121, "step": 14927 }, { "epoch": 0.45, "learning_rate": 3.024764669939062e-06, "loss": 1.1783, "step": 14928 }, { "epoch": 0.45, "learning_rate": 3.0245261815418923e-06, "loss": 1.0968, "step": 14929 }, { "epoch": 0.45, "learning_rate": 3.024287688151488e-06, "loss": 1.0508, "step": 14930 }, { "epoch": 0.45, "learning_rate": 3.0240491897701154e-06, "loss": 1.1603, "step": 14931 }, { "epoch": 0.45, "learning_rate": 3.023810686400048e-06, "loss": 1.1132, "step": 14932 }, { "epoch": 0.45, "learning_rate": 3.0235721780435547e-06, "loss": 1.0547, "step": 14933 }, { "epoch": 0.45, "learning_rate": 3.0233336647029065e-06, "loss": 1.09, "step": 14934 }, { "epoch": 0.45, "learning_rate": 3.0230951463803736e-06, "loss": 1.0119, "step": 14935 }, { "epoch": 0.45, "learning_rate": 3.0228566230782275e-06, "loss": 1.2341, "step": 14936 }, { "epoch": 0.45, "learning_rate": 3.0226180947987375e-06, "loss": 1.2206, "step": 14937 }, { "epoch": 0.45, "learning_rate": 3.0223795615441754e-06, "loss": 1.1182, "step": 14938 }, { "epoch": 0.45, "learning_rate": 3.0221410233168107e-06, "loss": 1.1302, "step": 14939 }, { "epoch": 0.45, "learning_rate": 3.0219024801189157e-06, "loss": 1.1982, "step": 14940 }, { "epoch": 0.45, "learning_rate": 3.0216639319527604e-06, "loss": 1.1483, "step": 14941 }, { "epoch": 0.45, "learning_rate": 3.0214253788206148e-06, "loss": 1.1927, "step": 14942 }, { "epoch": 0.45, "learning_rate": 3.021186820724752e-06, "loss": 1.1354, "step": 14943 }, { "epoch": 0.45, "learning_rate": 3.020948257667441e-06, "loss": 1.0372, "step": 14944 }, { "epoch": 0.45, "learning_rate": 3.020709689650954e-06, "loss": 1.1368, "step": 14945 }, { "epoch": 0.45, "learning_rate": 3.0204711166775615e-06, "loss": 1.145, "step": 14946 }, { "epoch": 0.45, "learning_rate": 3.020232538749534e-06, "loss": 1.0741, "step": 14947 }, { "epoch": 0.45, "learning_rate": 3.019993955869144e-06, "loss": 1.1126, "step": 14948 }, { "epoch": 0.45, "learning_rate": 3.0197553680386617e-06, "loss": 1.0806, "step": 14949 }, { "epoch": 0.45, "learning_rate": 3.019516775260358e-06, "loss": 1.1036, "step": 14950 }, { "epoch": 0.45, "learning_rate": 3.0192781775365047e-06, "loss": 1.1358, "step": 14951 }, { "epoch": 0.45, "learning_rate": 3.0190395748693747e-06, "loss": 1.1465, "step": 14952 }, { "epoch": 0.45, "learning_rate": 3.018800967261237e-06, "loss": 0.9894, "step": 14953 }, { "epoch": 0.45, "learning_rate": 3.0185623547143633e-06, "loss": 1.1562, "step": 14954 }, { "epoch": 0.45, "learning_rate": 3.0183237372310265e-06, "loss": 1.1361, "step": 14955 }, { "epoch": 0.45, "learning_rate": 3.0180851148134976e-06, "loss": 1.1638, "step": 14956 }, { "epoch": 0.45, "learning_rate": 3.0178464874640473e-06, "loss": 1.1564, "step": 14957 }, { "epoch": 0.45, "learning_rate": 3.0176078551849487e-06, "loss": 1.224, "step": 14958 }, { "epoch": 0.45, "learning_rate": 3.017369217978472e-06, "loss": 1.1669, "step": 14959 }, { "epoch": 0.45, "learning_rate": 3.0171305758468893e-06, "loss": 1.047, "step": 14960 }, { "epoch": 0.45, "learning_rate": 3.0168919287924732e-06, "loss": 1.2891, "step": 14961 }, { "epoch": 0.45, "learning_rate": 3.016653276817495e-06, "loss": 1.0485, "step": 14962 }, { "epoch": 0.45, "learning_rate": 3.0164146199242254e-06, "loss": 1.0698, "step": 14963 }, { "epoch": 0.45, "learning_rate": 3.016175958114938e-06, "loss": 1.2037, "step": 14964 }, { "epoch": 0.45, "learning_rate": 3.015937291391904e-06, "loss": 1.0697, "step": 14965 }, { "epoch": 0.45, "learning_rate": 3.0156986197573956e-06, "loss": 1.0734, "step": 14966 }, { "epoch": 0.45, "learning_rate": 3.0154599432136842e-06, "loss": 1.1746, "step": 14967 }, { "epoch": 0.45, "learning_rate": 3.0152212617630427e-06, "loss": 1.1586, "step": 14968 }, { "epoch": 0.45, "learning_rate": 3.0149825754077434e-06, "loss": 1.1862, "step": 14969 }, { "epoch": 0.45, "learning_rate": 3.014743884150057e-06, "loss": 1.1271, "step": 14970 }, { "epoch": 0.45, "learning_rate": 3.0145051879922576e-06, "loss": 1.1592, "step": 14971 }, { "epoch": 0.45, "learning_rate": 3.0142664869366163e-06, "loss": 1.1242, "step": 14972 }, { "epoch": 0.45, "learning_rate": 3.014027780985406e-06, "loss": 1.1035, "step": 14973 }, { "epoch": 0.45, "learning_rate": 3.0137890701408982e-06, "loss": 1.2027, "step": 14974 }, { "epoch": 0.45, "learning_rate": 3.0135503544053666e-06, "loss": 1.1534, "step": 14975 }, { "epoch": 0.45, "learning_rate": 3.0133116337810823e-06, "loss": 1.0423, "step": 14976 }, { "epoch": 0.45, "learning_rate": 3.013072908270319e-06, "loss": 1.0829, "step": 14977 }, { "epoch": 0.45, "learning_rate": 3.012834177875349e-06, "loss": 1.2991, "step": 14978 }, { "epoch": 0.45, "learning_rate": 3.012595442598444e-06, "loss": 1.1431, "step": 14979 }, { "epoch": 0.45, "learning_rate": 3.0123567024418763e-06, "loss": 1.0403, "step": 14980 }, { "epoch": 0.45, "learning_rate": 3.012117957407921e-06, "loss": 1.1014, "step": 14981 }, { "epoch": 0.45, "learning_rate": 3.011879207498849e-06, "loss": 1.0923, "step": 14982 }, { "epoch": 0.45, "learning_rate": 3.0116404527169336e-06, "loss": 1.05, "step": 14983 }, { "epoch": 0.45, "learning_rate": 3.0114016930644475e-06, "loss": 1.0977, "step": 14984 }, { "epoch": 0.45, "learning_rate": 3.0111629285436633e-06, "loss": 1.0594, "step": 14985 }, { "epoch": 0.45, "learning_rate": 3.010924159156855e-06, "loss": 1.1941, "step": 14986 }, { "epoch": 0.45, "learning_rate": 3.010685384906294e-06, "loss": 1.1496, "step": 14987 }, { "epoch": 0.45, "learning_rate": 3.0104466057942543e-06, "loss": 1.1786, "step": 14988 }, { "epoch": 0.45, "learning_rate": 3.0102078218230084e-06, "loss": 1.1038, "step": 14989 }, { "epoch": 0.45, "learning_rate": 3.00996903299483e-06, "loss": 1.107, "step": 14990 }, { "epoch": 0.45, "learning_rate": 3.0097302393119926e-06, "loss": 1.2237, "step": 14991 }, { "epoch": 0.45, "learning_rate": 3.0094914407767678e-06, "loss": 1.2612, "step": 14992 }, { "epoch": 0.45, "learning_rate": 3.009252637391431e-06, "loss": 1.1642, "step": 14993 }, { "epoch": 0.45, "learning_rate": 3.0090138291582533e-06, "loss": 1.2562, "step": 14994 }, { "epoch": 0.45, "learning_rate": 3.008775016079509e-06, "loss": 1.1235, "step": 14995 }, { "epoch": 0.45, "learning_rate": 3.008536198157472e-06, "loss": 1.114, "step": 14996 }, { "epoch": 0.45, "learning_rate": 3.0082973753944158e-06, "loss": 1.053, "step": 14997 }, { "epoch": 0.45, "learning_rate": 3.008058547792613e-06, "loss": 1.1693, "step": 14998 }, { "epoch": 0.45, "learning_rate": 3.0078197153543375e-06, "loss": 1.0311, "step": 14999 }, { "epoch": 0.45, "learning_rate": 3.007580878081863e-06, "loss": 1.1408, "step": 15000 }, { "epoch": 0.45, "learning_rate": 3.007342035977463e-06, "loss": 1.0805, "step": 15001 }, { "epoch": 0.45, "learning_rate": 3.007103189043411e-06, "loss": 1.0815, "step": 15002 }, { "epoch": 0.45, "learning_rate": 3.0068643372819807e-06, "loss": 1.132, "step": 15003 }, { "epoch": 0.45, "learning_rate": 3.0066254806954465e-06, "loss": 1.2695, "step": 15004 }, { "epoch": 0.45, "learning_rate": 3.006386619286081e-06, "loss": 1.1483, "step": 15005 }, { "epoch": 0.45, "learning_rate": 3.00614775305616e-06, "loss": 1.1975, "step": 15006 }, { "epoch": 0.45, "learning_rate": 3.005908882007955e-06, "loss": 1.1371, "step": 15007 }, { "epoch": 0.45, "learning_rate": 3.0056700061437416e-06, "loss": 1.1133, "step": 15008 }, { "epoch": 0.45, "learning_rate": 3.0054311254657925e-06, "loss": 1.1273, "step": 15009 }, { "epoch": 0.45, "learning_rate": 3.0051922399763837e-06, "loss": 1.0631, "step": 15010 }, { "epoch": 0.45, "learning_rate": 3.004953349677787e-06, "loss": 1.1359, "step": 15011 }, { "epoch": 0.45, "learning_rate": 3.004714454572279e-06, "loss": 1.1047, "step": 15012 }, { "epoch": 0.45, "learning_rate": 3.0044755546621314e-06, "loss": 1.106, "step": 15013 }, { "epoch": 0.45, "learning_rate": 3.00423664994962e-06, "loss": 1.152, "step": 15014 }, { "epoch": 0.45, "learning_rate": 3.003997740437018e-06, "loss": 1.0988, "step": 15015 }, { "epoch": 0.45, "learning_rate": 3.0037588261266004e-06, "loss": 1.0496, "step": 15016 }, { "epoch": 0.45, "learning_rate": 3.003519907020642e-06, "loss": 1.162, "step": 15017 }, { "epoch": 0.45, "learning_rate": 3.0032809831214157e-06, "loss": 1.1252, "step": 15018 }, { "epoch": 0.45, "learning_rate": 3.003042054431198e-06, "loss": 1.0586, "step": 15019 }, { "epoch": 0.45, "learning_rate": 3.002803120952261e-06, "loss": 1.1463, "step": 15020 }, { "epoch": 0.45, "learning_rate": 3.00256418268688e-06, "loss": 1.1293, "step": 15021 }, { "epoch": 0.45, "learning_rate": 3.0023252396373315e-06, "loss": 1.0838, "step": 15022 }, { "epoch": 0.45, "learning_rate": 3.002086291805888e-06, "loss": 1.2036, "step": 15023 }, { "epoch": 0.45, "learning_rate": 3.0018473391948244e-06, "loss": 1.0673, "step": 15024 }, { "epoch": 0.45, "learning_rate": 3.001608381806417e-06, "loss": 1.1108, "step": 15025 }, { "epoch": 0.45, "learning_rate": 3.001369419642938e-06, "loss": 1.1023, "step": 15026 }, { "epoch": 0.45, "learning_rate": 3.0011304527066646e-06, "loss": 1.067, "step": 15027 }, { "epoch": 0.45, "learning_rate": 3.0008914809998707e-06, "loss": 1.0644, "step": 15028 }, { "epoch": 0.45, "learning_rate": 3.000652504524831e-06, "loss": 1.0986, "step": 15029 }, { "epoch": 0.45, "learning_rate": 3.00041352328382e-06, "loss": 1.1628, "step": 15030 }, { "epoch": 0.45, "learning_rate": 3.0001745372791134e-06, "loss": 1.2697, "step": 15031 }, { "epoch": 0.45, "learning_rate": 2.9999355465129863e-06, "loss": 1.1801, "step": 15032 }, { "epoch": 0.45, "learning_rate": 2.9996965509877135e-06, "loss": 1.1409, "step": 15033 }, { "epoch": 0.45, "learning_rate": 2.9994575507055706e-06, "loss": 1.1143, "step": 15034 }, { "epoch": 0.45, "learning_rate": 2.9992185456688323e-06, "loss": 1.0839, "step": 15035 }, { "epoch": 0.45, "learning_rate": 2.998979535879773e-06, "loss": 1.1321, "step": 15036 }, { "epoch": 0.45, "learning_rate": 2.9987405213406696e-06, "loss": 1.066, "step": 15037 }, { "epoch": 0.45, "learning_rate": 2.9985015020537967e-06, "loss": 1.1416, "step": 15038 }, { "epoch": 0.45, "learning_rate": 2.9982624780214293e-06, "loss": 1.152, "step": 15039 }, { "epoch": 0.45, "learning_rate": 2.998023449245843e-06, "loss": 1.1181, "step": 15040 }, { "epoch": 0.45, "learning_rate": 2.9977844157293134e-06, "loss": 1.1052, "step": 15041 }, { "epoch": 0.45, "learning_rate": 2.9975453774741164e-06, "loss": 1.1062, "step": 15042 }, { "epoch": 0.45, "learning_rate": 2.9973063344825267e-06, "loss": 1.1058, "step": 15043 }, { "epoch": 0.45, "learning_rate": 2.9970672867568195e-06, "loss": 1.0695, "step": 15044 }, { "epoch": 0.45, "learning_rate": 2.996828234299272e-06, "loss": 1.1589, "step": 15045 }, { "epoch": 0.45, "learning_rate": 2.9965891771121584e-06, "loss": 1.0209, "step": 15046 }, { "epoch": 0.45, "learning_rate": 2.9963501151977557e-06, "loss": 1.0857, "step": 15047 }, { "epoch": 0.45, "learning_rate": 2.996111048558339e-06, "loss": 1.0541, "step": 15048 }, { "epoch": 0.45, "learning_rate": 2.995871977196183e-06, "loss": 1.1155, "step": 15049 }, { "epoch": 0.45, "learning_rate": 2.9956329011135655e-06, "loss": 0.9796, "step": 15050 }, { "epoch": 0.45, "learning_rate": 2.995393820312761e-06, "loss": 1.1225, "step": 15051 }, { "epoch": 0.45, "learning_rate": 2.9951547347960463e-06, "loss": 1.1925, "step": 15052 }, { "epoch": 0.45, "learning_rate": 2.9949156445656968e-06, "loss": 1.043, "step": 15053 }, { "epoch": 0.45, "learning_rate": 2.9946765496239887e-06, "loss": 1.1902, "step": 15054 }, { "epoch": 0.45, "learning_rate": 2.994437449973199e-06, "loss": 1.089, "step": 15055 }, { "epoch": 0.45, "learning_rate": 2.9941983456156014e-06, "loss": 1.1725, "step": 15056 }, { "epoch": 0.45, "learning_rate": 2.993959236553474e-06, "loss": 1.0436, "step": 15057 }, { "epoch": 0.45, "learning_rate": 2.993720122789093e-06, "loss": 1.159, "step": 15058 }, { "epoch": 0.45, "learning_rate": 2.993481004324734e-06, "loss": 1.193, "step": 15059 }, { "epoch": 0.45, "learning_rate": 2.993241881162674e-06, "loss": 1.125, "step": 15060 }, { "epoch": 0.45, "learning_rate": 2.993002753305188e-06, "loss": 1.0774, "step": 15061 }, { "epoch": 0.45, "learning_rate": 2.9927636207545536e-06, "loss": 1.2726, "step": 15062 }, { "epoch": 0.45, "learning_rate": 2.9925244835130467e-06, "loss": 1.124, "step": 15063 }, { "epoch": 0.45, "learning_rate": 2.9922853415829444e-06, "loss": 1.1584, "step": 15064 }, { "epoch": 0.45, "learning_rate": 2.9920461949665217e-06, "loss": 1.1003, "step": 15065 }, { "epoch": 0.45, "learning_rate": 2.9918070436660573e-06, "loss": 1.1501, "step": 15066 }, { "epoch": 0.45, "learning_rate": 2.991567887683826e-06, "loss": 1.0919, "step": 15067 }, { "epoch": 0.45, "learning_rate": 2.9913287270221065e-06, "loss": 1.2153, "step": 15068 }, { "epoch": 0.45, "learning_rate": 2.9910895616831725e-06, "loss": 1.1077, "step": 15069 }, { "epoch": 0.45, "learning_rate": 2.9908503916693027e-06, "loss": 1.1951, "step": 15070 }, { "epoch": 0.45, "learning_rate": 2.9906112169827745e-06, "loss": 1.1134, "step": 15071 }, { "epoch": 0.45, "learning_rate": 2.9903720376258628e-06, "loss": 1.0903, "step": 15072 }, { "epoch": 0.45, "learning_rate": 2.9901328536008462e-06, "loss": 1.2823, "step": 15073 }, { "epoch": 0.45, "learning_rate": 2.9898936649100004e-06, "loss": 0.9698, "step": 15074 }, { "epoch": 0.45, "learning_rate": 2.9896544715556037e-06, "loss": 1.1346, "step": 15075 }, { "epoch": 0.45, "learning_rate": 2.9894152735399314e-06, "loss": 1.1124, "step": 15076 }, { "epoch": 0.45, "learning_rate": 2.989176070865261e-06, "loss": 1.1754, "step": 15077 }, { "epoch": 0.45, "learning_rate": 2.9889368635338708e-06, "loss": 1.1156, "step": 15078 }, { "epoch": 0.45, "learning_rate": 2.988697651548037e-06, "loss": 1.1059, "step": 15079 }, { "epoch": 0.45, "learning_rate": 2.9884584349100366e-06, "loss": 1.0761, "step": 15080 }, { "epoch": 0.45, "learning_rate": 2.9882192136221476e-06, "loss": 1.0821, "step": 15081 }, { "epoch": 0.45, "learning_rate": 2.987979987686646e-06, "loss": 1.1146, "step": 15082 }, { "epoch": 0.45, "learning_rate": 2.9877407571058102e-06, "loss": 1.0707, "step": 15083 }, { "epoch": 0.45, "learning_rate": 2.987501521881918e-06, "loss": 1.1908, "step": 15084 }, { "epoch": 0.45, "learning_rate": 2.987262282017246e-06, "loss": 1.1755, "step": 15085 }, { "epoch": 0.45, "learning_rate": 2.987023037514072e-06, "loss": 1.2018, "step": 15086 }, { "epoch": 0.45, "learning_rate": 2.986783788374672e-06, "loss": 1.1385, "step": 15087 }, { "epoch": 0.45, "learning_rate": 2.986544534601326e-06, "loss": 1.0776, "step": 15088 }, { "epoch": 0.45, "learning_rate": 2.98630527619631e-06, "loss": 1.1719, "step": 15089 }, { "epoch": 0.45, "learning_rate": 2.9860660131619014e-06, "loss": 1.2012, "step": 15090 }, { "epoch": 0.45, "learning_rate": 2.9858267455003786e-06, "loss": 1.1574, "step": 15091 }, { "epoch": 0.45, "learning_rate": 2.98558747321402e-06, "loss": 1.2179, "step": 15092 }, { "epoch": 0.45, "learning_rate": 2.9853481963051016e-06, "loss": 1.0339, "step": 15093 }, { "epoch": 0.45, "learning_rate": 2.985108914775903e-06, "loss": 1.2458, "step": 15094 }, { "epoch": 0.45, "learning_rate": 2.9848696286287004e-06, "loss": 1.0337, "step": 15095 }, { "epoch": 0.45, "learning_rate": 2.9846303378657727e-06, "loss": 1.1053, "step": 15096 }, { "epoch": 0.45, "learning_rate": 2.984391042489398e-06, "loss": 1.15, "step": 15097 }, { "epoch": 0.45, "learning_rate": 2.984151742501853e-06, "loss": 1.2087, "step": 15098 }, { "epoch": 0.45, "learning_rate": 2.9839124379054173e-06, "loss": 1.0482, "step": 15099 }, { "epoch": 0.45, "learning_rate": 2.983673128702368e-06, "loss": 1.1539, "step": 15100 }, { "epoch": 0.45, "learning_rate": 2.9834338148949836e-06, "loss": 1.095, "step": 15101 }, { "epoch": 0.45, "learning_rate": 2.9831944964855418e-06, "loss": 1.1113, "step": 15102 }, { "epoch": 0.45, "learning_rate": 2.9829551734763213e-06, "loss": 1.1276, "step": 15103 }, { "epoch": 0.46, "learning_rate": 2.9827158458696005e-06, "loss": 1.1945, "step": 15104 }, { "epoch": 0.46, "learning_rate": 2.9824765136676564e-06, "loss": 1.2107, "step": 15105 }, { "epoch": 0.46, "learning_rate": 2.9822371768727685e-06, "loss": 1.076, "step": 15106 }, { "epoch": 0.46, "learning_rate": 2.9819978354872158e-06, "loss": 1.1466, "step": 15107 }, { "epoch": 0.46, "learning_rate": 2.981758489513275e-06, "loss": 1.1135, "step": 15108 }, { "epoch": 0.46, "learning_rate": 2.9815191389532254e-06, "loss": 1.1085, "step": 15109 }, { "epoch": 0.46, "learning_rate": 2.9812797838093465e-06, "loss": 1.1205, "step": 15110 }, { "epoch": 0.46, "learning_rate": 2.981040424083915e-06, "loss": 1.1611, "step": 15111 }, { "epoch": 0.46, "learning_rate": 2.980801059779211e-06, "loss": 1.1002, "step": 15112 }, { "epoch": 0.46, "learning_rate": 2.9805616908975115e-06, "loss": 1.1718, "step": 15113 }, { "epoch": 0.46, "learning_rate": 2.980322317441097e-06, "loss": 1.1441, "step": 15114 }, { "epoch": 0.46, "learning_rate": 2.980082939412245e-06, "loss": 1.1285, "step": 15115 }, { "epoch": 0.46, "learning_rate": 2.979843556813235e-06, "loss": 1.1803, "step": 15116 }, { "epoch": 0.46, "learning_rate": 2.9796041696463446e-06, "loss": 1.1855, "step": 15117 }, { "epoch": 0.46, "learning_rate": 2.979364777913854e-06, "loss": 1.1343, "step": 15118 }, { "epoch": 0.46, "learning_rate": 2.979125381618041e-06, "loss": 1.1429, "step": 15119 }, { "epoch": 0.46, "learning_rate": 2.9788859807611865e-06, "loss": 1.184, "step": 15120 }, { "epoch": 0.46, "learning_rate": 2.978646575345567e-06, "loss": 1.1431, "step": 15121 }, { "epoch": 0.46, "learning_rate": 2.978407165373463e-06, "loss": 1.1469, "step": 15122 }, { "epoch": 0.46, "learning_rate": 2.978167750847153e-06, "loss": 1.1286, "step": 15123 }, { "epoch": 0.46, "learning_rate": 2.977928331768916e-06, "loss": 1.0958, "step": 15124 }, { "epoch": 0.46, "learning_rate": 2.977688908141032e-06, "loss": 1.2067, "step": 15125 }, { "epoch": 0.46, "learning_rate": 2.9774494799657794e-06, "loss": 1.1445, "step": 15126 }, { "epoch": 0.46, "learning_rate": 2.9772100472454386e-06, "loss": 1.1758, "step": 15127 }, { "epoch": 0.46, "learning_rate": 2.9769706099822864e-06, "loss": 1.1334, "step": 15128 }, { "epoch": 0.46, "learning_rate": 2.9767311681786047e-06, "loss": 1.0557, "step": 15129 }, { "epoch": 0.46, "learning_rate": 2.9764917218366718e-06, "loss": 1.0811, "step": 15130 }, { "epoch": 0.46, "learning_rate": 2.9762522709587672e-06, "loss": 1.1133, "step": 15131 }, { "epoch": 0.46, "learning_rate": 2.9760128155471697e-06, "loss": 1.1093, "step": 15132 }, { "epoch": 0.46, "learning_rate": 2.97577335560416e-06, "loss": 1.1517, "step": 15133 }, { "epoch": 0.46, "learning_rate": 2.9755338911320177e-06, "loss": 1.1297, "step": 15134 }, { "epoch": 0.46, "learning_rate": 2.975294422133021e-06, "loss": 1.176, "step": 15135 }, { "epoch": 0.46, "learning_rate": 2.9750549486094505e-06, "loss": 1.1808, "step": 15136 }, { "epoch": 0.46, "learning_rate": 2.974815470563585e-06, "loss": 1.1867, "step": 15137 }, { "epoch": 0.46, "learning_rate": 2.974575987997706e-06, "loss": 1.0501, "step": 15138 }, { "epoch": 0.46, "learning_rate": 2.9743365009140916e-06, "loss": 1.0901, "step": 15139 }, { "epoch": 0.46, "learning_rate": 2.974097009315023e-06, "loss": 1.2015, "step": 15140 }, { "epoch": 0.46, "learning_rate": 2.973857513202778e-06, "loss": 1.1932, "step": 15141 }, { "epoch": 0.46, "learning_rate": 2.973618012579639e-06, "loss": 1.101, "step": 15142 }, { "epoch": 0.46, "learning_rate": 2.9733785074478833e-06, "loss": 1.1694, "step": 15143 }, { "epoch": 0.46, "learning_rate": 2.9731389978097926e-06, "loss": 1.1808, "step": 15144 }, { "epoch": 0.46, "learning_rate": 2.9728994836676465e-06, "loss": 1.0845, "step": 15145 }, { "epoch": 0.46, "learning_rate": 2.9726599650237253e-06, "loss": 1.1412, "step": 15146 }, { "epoch": 0.46, "learning_rate": 2.9724204418803083e-06, "loss": 1.1999, "step": 15147 }, { "epoch": 0.46, "learning_rate": 2.972180914239677e-06, "loss": 1.0638, "step": 15148 }, { "epoch": 0.46, "learning_rate": 2.9719413821041104e-06, "loss": 1.0128, "step": 15149 }, { "epoch": 0.46, "learning_rate": 2.971701845475889e-06, "loss": 1.1255, "step": 15150 }, { "epoch": 0.46, "learning_rate": 2.9714623043572936e-06, "loss": 1.1763, "step": 15151 }, { "epoch": 0.46, "learning_rate": 2.9712227587506035e-06, "loss": 1.0789, "step": 15152 }, { "epoch": 0.46, "learning_rate": 2.970983208658101e-06, "loss": 1.1083, "step": 15153 }, { "epoch": 0.46, "learning_rate": 2.970743654082064e-06, "loss": 1.1255, "step": 15154 }, { "epoch": 0.46, "learning_rate": 2.9705040950247743e-06, "loss": 1.0857, "step": 15155 }, { "epoch": 0.46, "learning_rate": 2.9702645314885126e-06, "loss": 1.0412, "step": 15156 }, { "epoch": 0.46, "learning_rate": 2.970024963475559e-06, "loss": 1.2633, "step": 15157 }, { "epoch": 0.46, "learning_rate": 2.9697853909881936e-06, "loss": 1.1854, "step": 15158 }, { "epoch": 0.46, "learning_rate": 2.9695458140286975e-06, "loss": 1.2025, "step": 15159 }, { "epoch": 0.46, "learning_rate": 2.9693062325993515e-06, "loss": 1.0794, "step": 15160 }, { "epoch": 0.46, "learning_rate": 2.9690666467024372e-06, "loss": 1.1824, "step": 15161 }, { "epoch": 0.46, "learning_rate": 2.9688270563402334e-06, "loss": 1.1319, "step": 15162 }, { "epoch": 0.46, "learning_rate": 2.968587461515022e-06, "loss": 1.1635, "step": 15163 }, { "epoch": 0.46, "learning_rate": 2.9683478622290832e-06, "loss": 1.1707, "step": 15164 }, { "epoch": 0.46, "learning_rate": 2.9681082584846986e-06, "loss": 1.0994, "step": 15165 }, { "epoch": 0.46, "learning_rate": 2.96786865028415e-06, "loss": 1.0969, "step": 15166 }, { "epoch": 0.46, "learning_rate": 2.9676290376297156e-06, "loss": 1.1609, "step": 15167 }, { "epoch": 0.46, "learning_rate": 2.9673894205236793e-06, "loss": 1.1219, "step": 15168 }, { "epoch": 0.46, "learning_rate": 2.9671497989683195e-06, "loss": 1.0663, "step": 15169 }, { "epoch": 0.46, "learning_rate": 2.9669101729659195e-06, "loss": 1.1117, "step": 15170 }, { "epoch": 0.46, "learning_rate": 2.9666705425187594e-06, "loss": 0.9832, "step": 15171 }, { "epoch": 0.46, "learning_rate": 2.96643090762912e-06, "loss": 1.1426, "step": 15172 }, { "epoch": 0.46, "learning_rate": 2.9661912682992827e-06, "loss": 1.1407, "step": 15173 }, { "epoch": 0.46, "learning_rate": 2.96595162453153e-06, "loss": 1.3425, "step": 15174 }, { "epoch": 0.46, "learning_rate": 2.9657119763281415e-06, "loss": 1.2319, "step": 15175 }, { "epoch": 0.46, "learning_rate": 2.9654723236913994e-06, "loss": 1.1123, "step": 15176 }, { "epoch": 0.46, "learning_rate": 2.9652326666235858e-06, "loss": 1.0679, "step": 15177 }, { "epoch": 0.46, "learning_rate": 2.9649930051269803e-06, "loss": 1.081, "step": 15178 }, { "epoch": 0.46, "learning_rate": 2.9647533392038662e-06, "loss": 1.1108, "step": 15179 }, { "epoch": 0.46, "learning_rate": 2.9645136688565233e-06, "loss": 1.0342, "step": 15180 }, { "epoch": 0.46, "learning_rate": 2.964273994087235e-06, "loss": 1.1391, "step": 15181 }, { "epoch": 0.46, "learning_rate": 2.964034314898281e-06, "loss": 1.213, "step": 15182 }, { "epoch": 0.46, "learning_rate": 2.9637946312919447e-06, "loss": 1.1373, "step": 15183 }, { "epoch": 0.46, "learning_rate": 2.963554943270506e-06, "loss": 1.1082, "step": 15184 }, { "epoch": 0.46, "learning_rate": 2.9633152508362474e-06, "loss": 0.9963, "step": 15185 }, { "epoch": 0.46, "learning_rate": 2.9630755539914514e-06, "loss": 1.2848, "step": 15186 }, { "epoch": 0.46, "learning_rate": 2.9628358527383983e-06, "loss": 1.2893, "step": 15187 }, { "epoch": 0.46, "learning_rate": 2.962596147079371e-06, "loss": 1.063, "step": 15188 }, { "epoch": 0.46, "learning_rate": 2.962356437016652e-06, "loss": 1.1129, "step": 15189 }, { "epoch": 0.46, "learning_rate": 2.962116722552522e-06, "loss": 1.2816, "step": 15190 }, { "epoch": 0.46, "learning_rate": 2.961877003689263e-06, "loss": 1.0707, "step": 15191 }, { "epoch": 0.46, "learning_rate": 2.9616372804291584e-06, "loss": 1.1216, "step": 15192 }, { "epoch": 0.46, "learning_rate": 2.9613975527744877e-06, "loss": 1.2029, "step": 15193 }, { "epoch": 0.46, "learning_rate": 2.961157820727536e-06, "loss": 1.2109, "step": 15194 }, { "epoch": 0.46, "learning_rate": 2.9609180842905825e-06, "loss": 1.1562, "step": 15195 }, { "epoch": 0.46, "learning_rate": 2.960678343465912e-06, "loss": 1.1432, "step": 15196 }, { "epoch": 0.46, "learning_rate": 2.960438598255805e-06, "loss": 1.1078, "step": 15197 }, { "epoch": 0.46, "learning_rate": 2.960198848662545e-06, "loss": 1.0883, "step": 15198 }, { "epoch": 0.46, "learning_rate": 2.9599590946884126e-06, "loss": 1.1275, "step": 15199 }, { "epoch": 0.46, "learning_rate": 2.9597193363356915e-06, "loss": 1.0878, "step": 15200 }, { "epoch": 0.46, "learning_rate": 2.9594795736066633e-06, "loss": 1.1597, "step": 15201 }, { "epoch": 0.46, "learning_rate": 2.959239806503611e-06, "loss": 1.0562, "step": 15202 }, { "epoch": 0.46, "learning_rate": 2.959000035028818e-06, "loss": 1.0573, "step": 15203 }, { "epoch": 0.46, "learning_rate": 2.958760259184564e-06, "loss": 1.1648, "step": 15204 }, { "epoch": 0.46, "learning_rate": 2.9585204789731346e-06, "loss": 1.1426, "step": 15205 }, { "epoch": 0.46, "learning_rate": 2.9582806943968106e-06, "loss": 1.192, "step": 15206 }, { "epoch": 0.46, "learning_rate": 2.958040905457876e-06, "loss": 1.099, "step": 15207 }, { "epoch": 0.46, "learning_rate": 2.9578011121586112e-06, "loss": 1.1116, "step": 15208 }, { "epoch": 0.46, "learning_rate": 2.9575613145013015e-06, "loss": 1.1235, "step": 15209 }, { "epoch": 0.46, "learning_rate": 2.957321512488228e-06, "loss": 1.0884, "step": 15210 }, { "epoch": 0.46, "learning_rate": 2.9570817061216737e-06, "loss": 1.1775, "step": 15211 }, { "epoch": 0.46, "learning_rate": 2.9568418954039215e-06, "loss": 1.1732, "step": 15212 }, { "epoch": 0.46, "learning_rate": 2.9566020803372548e-06, "loss": 1.0865, "step": 15213 }, { "epoch": 0.46, "learning_rate": 2.9563622609239555e-06, "loss": 1.0753, "step": 15214 }, { "epoch": 0.46, "learning_rate": 2.956122437166309e-06, "loss": 1.2009, "step": 15215 }, { "epoch": 0.46, "learning_rate": 2.955882609066595e-06, "loss": 1.0508, "step": 15216 }, { "epoch": 0.46, "learning_rate": 2.9556427766270986e-06, "loss": 1.1472, "step": 15217 }, { "epoch": 0.46, "learning_rate": 2.955402939850103e-06, "loss": 1.1876, "step": 15218 }, { "epoch": 0.46, "learning_rate": 2.9551630987378892e-06, "loss": 1.1252, "step": 15219 }, { "epoch": 0.46, "learning_rate": 2.9549232532927437e-06, "loss": 1.2089, "step": 15220 }, { "epoch": 0.46, "learning_rate": 2.954683403516947e-06, "loss": 1.2148, "step": 15221 }, { "epoch": 0.46, "learning_rate": 2.9544435494127832e-06, "loss": 1.0824, "step": 15222 }, { "epoch": 0.46, "learning_rate": 2.9542036909825363e-06, "loss": 1.1884, "step": 15223 }, { "epoch": 0.46, "learning_rate": 2.953963828228489e-06, "loss": 1.1586, "step": 15224 }, { "epoch": 0.46, "learning_rate": 2.953723961152924e-06, "loss": 1.1826, "step": 15225 }, { "epoch": 0.46, "learning_rate": 2.9534840897581254e-06, "loss": 1.0975, "step": 15226 }, { "epoch": 0.46, "learning_rate": 2.9532442140463768e-06, "loss": 1.1537, "step": 15227 }, { "epoch": 0.46, "learning_rate": 2.9530043340199622e-06, "loss": 1.1786, "step": 15228 }, { "epoch": 0.46, "learning_rate": 2.9527644496811636e-06, "loss": 1.1565, "step": 15229 }, { "epoch": 0.46, "learning_rate": 2.9525245610322658e-06, "loss": 1.1931, "step": 15230 }, { "epoch": 0.46, "learning_rate": 2.9522846680755523e-06, "loss": 1.1738, "step": 15231 }, { "epoch": 0.46, "learning_rate": 2.9520447708133065e-06, "loss": 1.0709, "step": 15232 }, { "epoch": 0.46, "learning_rate": 2.951804869247813e-06, "loss": 1.0923, "step": 15233 }, { "epoch": 0.46, "learning_rate": 2.9515649633813536e-06, "loss": 1.1462, "step": 15234 }, { "epoch": 0.46, "learning_rate": 2.9513250532162142e-06, "loss": 1.1812, "step": 15235 }, { "epoch": 0.46, "learning_rate": 2.951085138754677e-06, "loss": 1.2095, "step": 15236 }, { "epoch": 0.46, "learning_rate": 2.9508452199990267e-06, "loss": 1.2043, "step": 15237 }, { "epoch": 0.46, "learning_rate": 2.9506052969515466e-06, "loss": 1.1269, "step": 15238 }, { "epoch": 0.46, "learning_rate": 2.9503653696145218e-06, "loss": 1.0814, "step": 15239 }, { "epoch": 0.46, "learning_rate": 2.950125437990235e-06, "loss": 1.1186, "step": 15240 }, { "epoch": 0.46, "learning_rate": 2.949885502080971e-06, "loss": 1.1948, "step": 15241 }, { "epoch": 0.46, "learning_rate": 2.9496455618890137e-06, "loss": 1.1764, "step": 15242 }, { "epoch": 0.46, "learning_rate": 2.949405617416647e-06, "loss": 1.1849, "step": 15243 }, { "epoch": 0.46, "learning_rate": 2.949165668666156e-06, "loss": 1.1064, "step": 15244 }, { "epoch": 0.46, "learning_rate": 2.9489257156398233e-06, "loss": 1.1958, "step": 15245 }, { "epoch": 0.46, "learning_rate": 2.9486857583399347e-06, "loss": 1.0884, "step": 15246 }, { "epoch": 0.46, "learning_rate": 2.948445796768773e-06, "loss": 1.1046, "step": 15247 }, { "epoch": 0.46, "learning_rate": 2.9482058309286244e-06, "loss": 1.2487, "step": 15248 }, { "epoch": 0.46, "learning_rate": 2.947965860821771e-06, "loss": 1.1517, "step": 15249 }, { "epoch": 0.46, "learning_rate": 2.9477258864504994e-06, "loss": 1.0751, "step": 15250 }, { "epoch": 0.46, "learning_rate": 2.947485907817092e-06, "loss": 1.1018, "step": 15251 }, { "epoch": 0.46, "learning_rate": 2.947245924923835e-06, "loss": 1.0518, "step": 15252 }, { "epoch": 0.46, "learning_rate": 2.947005937773012e-06, "loss": 1.1943, "step": 15253 }, { "epoch": 0.46, "learning_rate": 2.9467659463669074e-06, "loss": 1.1164, "step": 15254 }, { "epoch": 0.46, "learning_rate": 2.9465259507078057e-06, "loss": 1.0811, "step": 15255 }, { "epoch": 0.46, "learning_rate": 2.946285950797993e-06, "loss": 1.0693, "step": 15256 }, { "epoch": 0.46, "learning_rate": 2.946045946639753e-06, "loss": 1.0799, "step": 15257 }, { "epoch": 0.46, "learning_rate": 2.9458059382353697e-06, "loss": 1.0778, "step": 15258 }, { "epoch": 0.46, "learning_rate": 2.9455659255871295e-06, "loss": 1.0701, "step": 15259 }, { "epoch": 0.46, "learning_rate": 2.9453259086973156e-06, "loss": 1.1718, "step": 15260 }, { "epoch": 0.46, "learning_rate": 2.9450858875682144e-06, "loss": 1.2208, "step": 15261 }, { "epoch": 0.46, "learning_rate": 2.9448458622021087e-06, "loss": 1.2162, "step": 15262 }, { "epoch": 0.46, "learning_rate": 2.9446058326012855e-06, "loss": 1.204, "step": 15263 }, { "epoch": 0.46, "learning_rate": 2.9443657987680284e-06, "loss": 1.0222, "step": 15264 }, { "epoch": 0.46, "learning_rate": 2.9441257607046236e-06, "loss": 1.1031, "step": 15265 }, { "epoch": 0.46, "learning_rate": 2.9438857184133546e-06, "loss": 1.0738, "step": 15266 }, { "epoch": 0.46, "learning_rate": 2.943645671896508e-06, "loss": 1.2951, "step": 15267 }, { "epoch": 0.46, "learning_rate": 2.9434056211563674e-06, "loss": 1.1537, "step": 15268 }, { "epoch": 0.46, "learning_rate": 2.9431655661952198e-06, "loss": 0.9945, "step": 15269 }, { "epoch": 0.46, "learning_rate": 2.9429255070153484e-06, "loss": 1.0731, "step": 15270 }, { "epoch": 0.46, "learning_rate": 2.94268544361904e-06, "loss": 1.1155, "step": 15271 }, { "epoch": 0.46, "learning_rate": 2.9424453760085803e-06, "loss": 1.087, "step": 15272 }, { "epoch": 0.46, "learning_rate": 2.9422053041862525e-06, "loss": 1.1404, "step": 15273 }, { "epoch": 0.46, "learning_rate": 2.941965228154344e-06, "loss": 1.2064, "step": 15274 }, { "epoch": 0.46, "learning_rate": 2.9417251479151386e-06, "loss": 1.2646, "step": 15275 }, { "epoch": 0.46, "learning_rate": 2.9414850634709235e-06, "loss": 1.1467, "step": 15276 }, { "epoch": 0.46, "learning_rate": 2.9412449748239824e-06, "loss": 1.0895, "step": 15277 }, { "epoch": 0.46, "learning_rate": 2.9410048819766024e-06, "loss": 1.0745, "step": 15278 }, { "epoch": 0.46, "learning_rate": 2.940764784931067e-06, "loss": 1.0398, "step": 15279 }, { "epoch": 0.46, "learning_rate": 2.9405246836896643e-06, "loss": 1.2407, "step": 15280 }, { "epoch": 0.46, "learning_rate": 2.9402845782546785e-06, "loss": 1.1907, "step": 15281 }, { "epoch": 0.46, "learning_rate": 2.9400444686283953e-06, "loss": 1.048, "step": 15282 }, { "epoch": 0.46, "learning_rate": 2.9398043548131005e-06, "loss": 1.0909, "step": 15283 }, { "epoch": 0.46, "learning_rate": 2.9395642368110807e-06, "loss": 1.1077, "step": 15284 }, { "epoch": 0.46, "learning_rate": 2.939324114624621e-06, "loss": 1.0922, "step": 15285 }, { "epoch": 0.46, "learning_rate": 2.9390839882560067e-06, "loss": 1.1678, "step": 15286 }, { "epoch": 0.46, "learning_rate": 2.9388438577075252e-06, "loss": 1.199, "step": 15287 }, { "epoch": 0.46, "learning_rate": 2.9386037229814607e-06, "loss": 1.1561, "step": 15288 }, { "epoch": 0.46, "learning_rate": 2.9383635840801007e-06, "loss": 1.1055, "step": 15289 }, { "epoch": 0.46, "learning_rate": 2.93812344100573e-06, "loss": 0.9777, "step": 15290 }, { "epoch": 0.46, "learning_rate": 2.9378832937606357e-06, "loss": 1.157, "step": 15291 }, { "epoch": 0.46, "learning_rate": 2.9376431423471023e-06, "loss": 1.2474, "step": 15292 }, { "epoch": 0.46, "learning_rate": 2.9374029867674183e-06, "loss": 1.2162, "step": 15293 }, { "epoch": 0.46, "learning_rate": 2.9371628270238672e-06, "loss": 1.1478, "step": 15294 }, { "epoch": 0.46, "learning_rate": 2.936922663118737e-06, "loss": 1.2199, "step": 15295 }, { "epoch": 0.46, "learning_rate": 2.9366824950543138e-06, "loss": 1.0107, "step": 15296 }, { "epoch": 0.46, "learning_rate": 2.9364423228328832e-06, "loss": 1.1539, "step": 15297 }, { "epoch": 0.46, "learning_rate": 2.936202146456732e-06, "loss": 1.1076, "step": 15298 }, { "epoch": 0.46, "learning_rate": 2.9359619659281464e-06, "loss": 1.1106, "step": 15299 }, { "epoch": 0.46, "learning_rate": 2.9357217812494133e-06, "loss": 1.073, "step": 15300 }, { "epoch": 0.46, "learning_rate": 2.935481592422818e-06, "loss": 1.1857, "step": 15301 }, { "epoch": 0.46, "learning_rate": 2.9352413994506484e-06, "loss": 1.1838, "step": 15302 }, { "epoch": 0.46, "learning_rate": 2.9350012023351898e-06, "loss": 1.0374, "step": 15303 }, { "epoch": 0.46, "learning_rate": 2.9347610010787297e-06, "loss": 1.0609, "step": 15304 }, { "epoch": 0.46, "learning_rate": 2.9345207956835537e-06, "loss": 1.0557, "step": 15305 }, { "epoch": 0.46, "learning_rate": 2.9342805861519498e-06, "loss": 1.2979, "step": 15306 }, { "epoch": 0.46, "learning_rate": 2.9340403724862034e-06, "loss": 1.1713, "step": 15307 }, { "epoch": 0.46, "learning_rate": 2.9338001546886006e-06, "loss": 1.1947, "step": 15308 }, { "epoch": 0.46, "learning_rate": 2.9335599327614306e-06, "loss": 1.1198, "step": 15309 }, { "epoch": 0.46, "learning_rate": 2.9333197067069786e-06, "loss": 1.1192, "step": 15310 }, { "epoch": 0.46, "learning_rate": 2.9330794765275317e-06, "loss": 1.1532, "step": 15311 }, { "epoch": 0.46, "learning_rate": 2.932839242225376e-06, "loss": 1.105, "step": 15312 }, { "epoch": 0.46, "learning_rate": 2.9325990038028e-06, "loss": 1.1465, "step": 15313 }, { "epoch": 0.46, "learning_rate": 2.9323587612620897e-06, "loss": 1.1036, "step": 15314 }, { "epoch": 0.46, "learning_rate": 2.9321185146055327e-06, "loss": 1.1508, "step": 15315 }, { "epoch": 0.46, "learning_rate": 2.931878263835415e-06, "loss": 1.2097, "step": 15316 }, { "epoch": 0.46, "learning_rate": 2.931638008954024e-06, "loss": 1.1707, "step": 15317 }, { "epoch": 0.46, "learning_rate": 2.9313977499636476e-06, "loss": 1.2238, "step": 15318 }, { "epoch": 0.46, "learning_rate": 2.9311574868665724e-06, "loss": 1.1213, "step": 15319 }, { "epoch": 0.46, "learning_rate": 2.930917219665085e-06, "loss": 1.0572, "step": 15320 }, { "epoch": 0.46, "learning_rate": 2.930676948361474e-06, "loss": 1.0863, "step": 15321 }, { "epoch": 0.46, "learning_rate": 2.930436672958025e-06, "loss": 1.1154, "step": 15322 }, { "epoch": 0.46, "learning_rate": 2.9301963934570266e-06, "loss": 1.129, "step": 15323 }, { "epoch": 0.46, "learning_rate": 2.9299561098607653e-06, "loss": 1.0925, "step": 15324 }, { "epoch": 0.46, "learning_rate": 2.929715822171529e-06, "loss": 1.1025, "step": 15325 }, { "epoch": 0.46, "learning_rate": 2.9294755303916054e-06, "loss": 1.1542, "step": 15326 }, { "epoch": 0.46, "learning_rate": 2.9292352345232817e-06, "loss": 1.01, "step": 15327 }, { "epoch": 0.46, "learning_rate": 2.928994934568845e-06, "loss": 1.1523, "step": 15328 }, { "epoch": 0.46, "learning_rate": 2.928754630530583e-06, "loss": 1.1139, "step": 15329 }, { "epoch": 0.46, "learning_rate": 2.9285143224107844e-06, "loss": 1.1403, "step": 15330 }, { "epoch": 0.46, "learning_rate": 2.9282740102117345e-06, "loss": 1.2197, "step": 15331 }, { "epoch": 0.46, "learning_rate": 2.9280336939357235e-06, "loss": 1.0397, "step": 15332 }, { "epoch": 0.46, "learning_rate": 2.9277933735850365e-06, "loss": 1.0361, "step": 15333 }, { "epoch": 0.46, "learning_rate": 2.927553049161964e-06, "loss": 1.0681, "step": 15334 }, { "epoch": 0.46, "learning_rate": 2.9273127206687917e-06, "loss": 1.0795, "step": 15335 }, { "epoch": 0.46, "learning_rate": 2.927072388107808e-06, "loss": 1.0115, "step": 15336 }, { "epoch": 0.46, "learning_rate": 2.926832051481301e-06, "loss": 1.16, "step": 15337 }, { "epoch": 0.46, "learning_rate": 2.9265917107915576e-06, "loss": 1.1026, "step": 15338 }, { "epoch": 0.46, "learning_rate": 2.926351366040868e-06, "loss": 1.1342, "step": 15339 }, { "epoch": 0.46, "learning_rate": 2.9261110172315177e-06, "loss": 1.0918, "step": 15340 }, { "epoch": 0.46, "learning_rate": 2.925870664365797e-06, "loss": 1.0782, "step": 15341 }, { "epoch": 0.46, "learning_rate": 2.925630307445991e-06, "loss": 1.087, "step": 15342 }, { "epoch": 0.46, "learning_rate": 2.925389946474391e-06, "loss": 1.1384, "step": 15343 }, { "epoch": 0.46, "learning_rate": 2.925149581453283e-06, "loss": 1.1616, "step": 15344 }, { "epoch": 0.46, "learning_rate": 2.9249092123849554e-06, "loss": 1.1396, "step": 15345 }, { "epoch": 0.46, "learning_rate": 2.924668839271697e-06, "loss": 1.0593, "step": 15346 }, { "epoch": 0.46, "learning_rate": 2.9244284621157958e-06, "loss": 1.1718, "step": 15347 }, { "epoch": 0.46, "learning_rate": 2.92418808091954e-06, "loss": 1.1968, "step": 15348 }, { "epoch": 0.46, "learning_rate": 2.923947695685218e-06, "loss": 1.1286, "step": 15349 }, { "epoch": 0.46, "learning_rate": 2.923707306415118e-06, "loss": 1.1546, "step": 15350 }, { "epoch": 0.46, "learning_rate": 2.923466913111529e-06, "loss": 1.1969, "step": 15351 }, { "epoch": 0.46, "learning_rate": 2.923226515776738e-06, "loss": 1.0616, "step": 15352 }, { "epoch": 0.46, "learning_rate": 2.9229861144130345e-06, "loss": 1.1492, "step": 15353 }, { "epoch": 0.46, "learning_rate": 2.9227457090227078e-06, "loss": 1.2054, "step": 15354 }, { "epoch": 0.46, "learning_rate": 2.922505299608045e-06, "loss": 1.1171, "step": 15355 }, { "epoch": 0.46, "learning_rate": 2.922264886171336e-06, "loss": 1.1785, "step": 15356 }, { "epoch": 0.46, "learning_rate": 2.9220244687148674e-06, "loss": 1.1501, "step": 15357 }, { "epoch": 0.46, "learning_rate": 2.9217840472409304e-06, "loss": 1.1006, "step": 15358 }, { "epoch": 0.46, "learning_rate": 2.9215436217518113e-06, "loss": 1.098, "step": 15359 }, { "epoch": 0.46, "learning_rate": 2.921303192249801e-06, "loss": 1.2128, "step": 15360 }, { "epoch": 0.46, "learning_rate": 2.921062758737186e-06, "loss": 1.191, "step": 15361 }, { "epoch": 0.46, "learning_rate": 2.920822321216257e-06, "loss": 1.1768, "step": 15362 }, { "epoch": 0.46, "learning_rate": 2.920581879689302e-06, "loss": 1.1646, "step": 15363 }, { "epoch": 0.46, "learning_rate": 2.92034143415861e-06, "loss": 1.1682, "step": 15364 }, { "epoch": 0.46, "learning_rate": 2.9201009846264698e-06, "loss": 1.1083, "step": 15365 }, { "epoch": 0.46, "learning_rate": 2.919860531095171e-06, "loss": 1.0498, "step": 15366 }, { "epoch": 0.46, "learning_rate": 2.919620073567002e-06, "loss": 1.0893, "step": 15367 }, { "epoch": 0.46, "learning_rate": 2.919379612044252e-06, "loss": 1.1752, "step": 15368 }, { "epoch": 0.46, "learning_rate": 2.9191391465292106e-06, "loss": 1.1844, "step": 15369 }, { "epoch": 0.46, "learning_rate": 2.9188986770241657e-06, "loss": 1.1494, "step": 15370 }, { "epoch": 0.46, "learning_rate": 2.9186582035314075e-06, "loss": 1.1038, "step": 15371 }, { "epoch": 0.46, "learning_rate": 2.918417726053224e-06, "loss": 1.1061, "step": 15372 }, { "epoch": 0.46, "learning_rate": 2.9181772445919065e-06, "loss": 1.1005, "step": 15373 }, { "epoch": 0.46, "learning_rate": 2.917936759149743e-06, "loss": 1.1454, "step": 15374 }, { "epoch": 0.46, "learning_rate": 2.9176962697290217e-06, "loss": 0.9883, "step": 15375 }, { "epoch": 0.46, "learning_rate": 2.9174557763320336e-06, "loss": 1.0516, "step": 15376 }, { "epoch": 0.46, "learning_rate": 2.9172152789610677e-06, "loss": 1.1109, "step": 15377 }, { "epoch": 0.46, "learning_rate": 2.9169747776184133e-06, "loss": 1.1054, "step": 15378 }, { "epoch": 0.46, "learning_rate": 2.9167342723063597e-06, "loss": 1.2042, "step": 15379 }, { "epoch": 0.46, "learning_rate": 2.916493763027197e-06, "loss": 1.1685, "step": 15380 }, { "epoch": 0.46, "learning_rate": 2.916253249783213e-06, "loss": 1.2239, "step": 15381 }, { "epoch": 0.46, "learning_rate": 2.9160127325767e-06, "loss": 1.2192, "step": 15382 }, { "epoch": 0.46, "learning_rate": 2.915772211409945e-06, "loss": 1.0214, "step": 15383 }, { "epoch": 0.46, "learning_rate": 2.9155316862852403e-06, "loss": 1.1834, "step": 15384 }, { "epoch": 0.46, "learning_rate": 2.9152911572048726e-06, "loss": 1.1339, "step": 15385 }, { "epoch": 0.46, "learning_rate": 2.915050624171134e-06, "loss": 1.2709, "step": 15386 }, { "epoch": 0.46, "learning_rate": 2.914810087186313e-06, "loss": 1.4092, "step": 15387 }, { "epoch": 0.46, "learning_rate": 2.914569546252699e-06, "loss": 1.0567, "step": 15388 }, { "epoch": 0.46, "learning_rate": 2.914329001372584e-06, "loss": 1.1176, "step": 15389 }, { "epoch": 0.46, "learning_rate": 2.9140884525482554e-06, "loss": 1.2012, "step": 15390 }, { "epoch": 0.46, "learning_rate": 2.9138478997820043e-06, "loss": 1.1285, "step": 15391 }, { "epoch": 0.46, "learning_rate": 2.913607343076121e-06, "loss": 1.0853, "step": 15392 }, { "epoch": 0.46, "learning_rate": 2.9133667824328947e-06, "loss": 1.1532, "step": 15393 }, { "epoch": 0.46, "learning_rate": 2.9131262178546154e-06, "loss": 1.1221, "step": 15394 }, { "epoch": 0.46, "learning_rate": 2.9128856493435744e-06, "loss": 1.1426, "step": 15395 }, { "epoch": 0.46, "learning_rate": 2.91264507690206e-06, "loss": 1.1436, "step": 15396 }, { "epoch": 0.46, "learning_rate": 2.9124045005323637e-06, "loss": 1.2122, "step": 15397 }, { "epoch": 0.46, "learning_rate": 2.9121639202367748e-06, "loss": 1.027, "step": 15398 }, { "epoch": 0.46, "learning_rate": 2.911923336017584e-06, "loss": 1.0868, "step": 15399 }, { "epoch": 0.46, "learning_rate": 2.9116827478770816e-06, "loss": 1.1002, "step": 15400 }, { "epoch": 0.46, "learning_rate": 2.911442155817558e-06, "loss": 1.1552, "step": 15401 }, { "epoch": 0.46, "learning_rate": 2.9112015598413024e-06, "loss": 1.1176, "step": 15402 }, { "epoch": 0.46, "learning_rate": 2.910960959950606e-06, "loss": 1.1057, "step": 15403 }, { "epoch": 0.46, "learning_rate": 2.9107203561477603e-06, "loss": 1.108, "step": 15404 }, { "epoch": 0.46, "learning_rate": 2.910479748435054e-06, "loss": 1.2258, "step": 15405 }, { "epoch": 0.46, "learning_rate": 2.9102391368147777e-06, "loss": 1.2386, "step": 15406 }, { "epoch": 0.46, "learning_rate": 2.9099985212892225e-06, "loss": 1.1736, "step": 15407 }, { "epoch": 0.46, "learning_rate": 2.9097579018606792e-06, "loss": 1.0826, "step": 15408 }, { "epoch": 0.46, "learning_rate": 2.909517278531438e-06, "loss": 1.1401, "step": 15409 }, { "epoch": 0.46, "learning_rate": 2.90927665130379e-06, "loss": 1.0833, "step": 15410 }, { "epoch": 0.46, "learning_rate": 2.9090360201800244e-06, "loss": 1.1562, "step": 15411 }, { "epoch": 0.46, "learning_rate": 2.908795385162434e-06, "loss": 1.2131, "step": 15412 }, { "epoch": 0.46, "learning_rate": 2.9085547462533077e-06, "loss": 0.9659, "step": 15413 }, { "epoch": 0.46, "learning_rate": 2.9083141034549374e-06, "loss": 1.0551, "step": 15414 }, { "epoch": 0.46, "learning_rate": 2.908073456769613e-06, "loss": 0.9518, "step": 15415 }, { "epoch": 0.46, "learning_rate": 2.9078328061996255e-06, "loss": 1.1272, "step": 15416 }, { "epoch": 0.46, "learning_rate": 2.907592151747267e-06, "loss": 1.0624, "step": 15417 }, { "epoch": 0.46, "learning_rate": 2.9073514934148268e-06, "loss": 1.1208, "step": 15418 }, { "epoch": 0.46, "learning_rate": 2.907110831204597e-06, "loss": 1.1256, "step": 15419 }, { "epoch": 0.46, "learning_rate": 2.9068701651188673e-06, "loss": 1.1167, "step": 15420 }, { "epoch": 0.46, "learning_rate": 2.906629495159931e-06, "loss": 1.1276, "step": 15421 }, { "epoch": 0.46, "learning_rate": 2.9063888213300767e-06, "loss": 1.205, "step": 15422 }, { "epoch": 0.46, "learning_rate": 2.9061481436315976e-06, "loss": 1.1494, "step": 15423 }, { "epoch": 0.46, "learning_rate": 2.9059074620667828e-06, "loss": 1.1948, "step": 15424 }, { "epoch": 0.46, "learning_rate": 2.905666776637925e-06, "loss": 1.1508, "step": 15425 }, { "epoch": 0.46, "learning_rate": 2.9054260873473145e-06, "loss": 1.1298, "step": 15426 }, { "epoch": 0.46, "learning_rate": 2.905185394197243e-06, "loss": 1.1162, "step": 15427 }, { "epoch": 0.46, "learning_rate": 2.904944697190002e-06, "loss": 1.1188, "step": 15428 }, { "epoch": 0.46, "learning_rate": 2.904703996327882e-06, "loss": 1.1188, "step": 15429 }, { "epoch": 0.46, "learning_rate": 2.9044632916131754e-06, "loss": 1.0731, "step": 15430 }, { "epoch": 0.46, "learning_rate": 2.9042225830481724e-06, "loss": 1.2458, "step": 15431 }, { "epoch": 0.46, "learning_rate": 2.903981870635165e-06, "loss": 1.2482, "step": 15432 }, { "epoch": 0.46, "learning_rate": 2.903741154376446e-06, "loss": 1.1992, "step": 15433 }, { "epoch": 0.46, "learning_rate": 2.9035004342743043e-06, "loss": 1.1049, "step": 15434 }, { "epoch": 0.46, "learning_rate": 2.9032597103310336e-06, "loss": 1.1496, "step": 15435 }, { "epoch": 0.47, "learning_rate": 2.903018982548924e-06, "loss": 1.1624, "step": 15436 }, { "epoch": 0.47, "learning_rate": 2.9027782509302684e-06, "loss": 1.1592, "step": 15437 }, { "epoch": 0.47, "learning_rate": 2.9025375154773577e-06, "loss": 1.1997, "step": 15438 }, { "epoch": 0.47, "learning_rate": 2.9022967761924835e-06, "loss": 1.0994, "step": 15439 }, { "epoch": 0.47, "learning_rate": 2.9020560330779387e-06, "loss": 1.0758, "step": 15440 }, { "epoch": 0.47, "learning_rate": 2.901815286136013e-06, "loss": 1.1151, "step": 15441 }, { "epoch": 0.47, "learning_rate": 2.9015745353689993e-06, "loss": 1.1336, "step": 15442 }, { "epoch": 0.47, "learning_rate": 2.90133378077919e-06, "loss": 1.1876, "step": 15443 }, { "epoch": 0.47, "learning_rate": 2.901093022368876e-06, "loss": 1.0344, "step": 15444 }, { "epoch": 0.47, "learning_rate": 2.90085226014035e-06, "loss": 1.2045, "step": 15445 }, { "epoch": 0.47, "learning_rate": 2.900611494095903e-06, "loss": 1.1277, "step": 15446 }, { "epoch": 0.47, "learning_rate": 2.9003707242378277e-06, "loss": 1.0372, "step": 15447 }, { "epoch": 0.47, "learning_rate": 2.900129950568416e-06, "loss": 1.1934, "step": 15448 }, { "epoch": 0.47, "learning_rate": 2.8998891730899604e-06, "loss": 1.0757, "step": 15449 }, { "epoch": 0.47, "learning_rate": 2.8996483918047512e-06, "loss": 1.0126, "step": 15450 }, { "epoch": 0.47, "learning_rate": 2.8994076067150834e-06, "loss": 1.1448, "step": 15451 }, { "epoch": 0.47, "learning_rate": 2.899166817823246e-06, "loss": 1.2203, "step": 15452 }, { "epoch": 0.47, "learning_rate": 2.8989260251315342e-06, "loss": 1.2487, "step": 15453 }, { "epoch": 0.47, "learning_rate": 2.898685228642238e-06, "loss": 1.1958, "step": 15454 }, { "epoch": 0.47, "learning_rate": 2.89844442835765e-06, "loss": 1.1293, "step": 15455 }, { "epoch": 0.47, "learning_rate": 2.898203624280064e-06, "loss": 1.1465, "step": 15456 }, { "epoch": 0.47, "learning_rate": 2.89796281641177e-06, "loss": 1.067, "step": 15457 }, { "epoch": 0.47, "learning_rate": 2.8977220047550625e-06, "loss": 1.0596, "step": 15458 }, { "epoch": 0.47, "learning_rate": 2.897481189312233e-06, "loss": 1.0548, "step": 15459 }, { "epoch": 0.47, "learning_rate": 2.8972403700855733e-06, "loss": 1.0717, "step": 15460 }, { "epoch": 0.47, "learning_rate": 2.896999547077377e-06, "loss": 1.1292, "step": 15461 }, { "epoch": 0.47, "learning_rate": 2.8967587202899374e-06, "loss": 1.2329, "step": 15462 }, { "epoch": 0.47, "learning_rate": 2.896517889725544e-06, "loss": 1.0721, "step": 15463 }, { "epoch": 0.47, "learning_rate": 2.8962770553864927e-06, "loss": 1.1569, "step": 15464 }, { "epoch": 0.47, "learning_rate": 2.896036217275074e-06, "loss": 1.1213, "step": 15465 }, { "epoch": 0.47, "learning_rate": 2.895795375393582e-06, "loss": 1.1948, "step": 15466 }, { "epoch": 0.47, "learning_rate": 2.8955545297443077e-06, "loss": 1.0972, "step": 15467 }, { "epoch": 0.47, "learning_rate": 2.8953136803295446e-06, "loss": 1.2265, "step": 15468 }, { "epoch": 0.47, "learning_rate": 2.8950728271515865e-06, "loss": 0.9622, "step": 15469 }, { "epoch": 0.47, "learning_rate": 2.8948319702127246e-06, "loss": 1.1498, "step": 15470 }, { "epoch": 0.47, "learning_rate": 2.8945911095152536e-06, "loss": 1.0801, "step": 15471 }, { "epoch": 0.47, "learning_rate": 2.894350245061464e-06, "loss": 1.0844, "step": 15472 }, { "epoch": 0.47, "learning_rate": 2.894109376853651e-06, "loss": 1.2139, "step": 15473 }, { "epoch": 0.47, "learning_rate": 2.8938685048941056e-06, "loss": 1.1483, "step": 15474 }, { "epoch": 0.47, "learning_rate": 2.8936276291851227e-06, "loss": 1.0436, "step": 15475 }, { "epoch": 0.47, "learning_rate": 2.8933867497289936e-06, "loss": 1.1721, "step": 15476 }, { "epoch": 0.47, "learning_rate": 2.893145866528013e-06, "loss": 1.0829, "step": 15477 }, { "epoch": 0.47, "learning_rate": 2.892904979584472e-06, "loss": 1.1601, "step": 15478 }, { "epoch": 0.47, "learning_rate": 2.892664088900666e-06, "loss": 1.134, "step": 15479 }, { "epoch": 0.47, "learning_rate": 2.8924231944788863e-06, "loss": 1.0319, "step": 15480 }, { "epoch": 0.47, "learning_rate": 2.8921822963214263e-06, "loss": 1.0905, "step": 15481 }, { "epoch": 0.47, "learning_rate": 2.89194139443058e-06, "loss": 1.1843, "step": 15482 }, { "epoch": 0.47, "learning_rate": 2.891700488808641e-06, "loss": 1.1782, "step": 15483 }, { "epoch": 0.47, "learning_rate": 2.8914595794579016e-06, "loss": 1.0302, "step": 15484 }, { "epoch": 0.47, "learning_rate": 2.891218666380655e-06, "loss": 1.1299, "step": 15485 }, { "epoch": 0.47, "learning_rate": 2.8909777495791965e-06, "loss": 1.151, "step": 15486 }, { "epoch": 0.47, "learning_rate": 2.8907368290558167e-06, "loss": 1.2505, "step": 15487 }, { "epoch": 0.47, "learning_rate": 2.890495904812811e-06, "loss": 1.1427, "step": 15488 }, { "epoch": 0.47, "learning_rate": 2.8902549768524724e-06, "loss": 1.1201, "step": 15489 }, { "epoch": 0.47, "learning_rate": 2.8900140451770946e-06, "loss": 1.0848, "step": 15490 }, { "epoch": 0.47, "learning_rate": 2.88977310978897e-06, "loss": 1.1512, "step": 15491 }, { "epoch": 0.47, "learning_rate": 2.8895321706903946e-06, "loss": 1.1475, "step": 15492 }, { "epoch": 0.47, "learning_rate": 2.88929122788366e-06, "loss": 1.0983, "step": 15493 }, { "epoch": 0.47, "learning_rate": 2.88905028137106e-06, "loss": 1.105, "step": 15494 }, { "epoch": 0.47, "learning_rate": 2.8888093311548887e-06, "loss": 1.1317, "step": 15495 }, { "epoch": 0.47, "learning_rate": 2.88856837723744e-06, "loss": 1.1132, "step": 15496 }, { "epoch": 0.47, "learning_rate": 2.8883274196210077e-06, "loss": 1.1471, "step": 15497 }, { "epoch": 0.47, "learning_rate": 2.8880864583078848e-06, "loss": 1.149, "step": 15498 }, { "epoch": 0.47, "learning_rate": 2.8878454933003662e-06, "loss": 1.1446, "step": 15499 }, { "epoch": 0.47, "learning_rate": 2.8876045246007454e-06, "loss": 1.0942, "step": 15500 }, { "epoch": 0.47, "learning_rate": 2.8873635522113157e-06, "loss": 1.0443, "step": 15501 }, { "epoch": 0.47, "learning_rate": 2.887122576134372e-06, "loss": 0.9877, "step": 15502 }, { "epoch": 0.47, "learning_rate": 2.8868815963722074e-06, "loss": 1.2141, "step": 15503 }, { "epoch": 0.47, "learning_rate": 2.886640612927117e-06, "loss": 1.1041, "step": 15504 }, { "epoch": 0.47, "learning_rate": 2.8863996258013938e-06, "loss": 1.1407, "step": 15505 }, { "epoch": 0.47, "learning_rate": 2.886158634997332e-06, "loss": 1.2051, "step": 15506 }, { "epoch": 0.47, "learning_rate": 2.885917640517226e-06, "loss": 1.0466, "step": 15507 }, { "epoch": 0.47, "learning_rate": 2.8856766423633703e-06, "loss": 1.1061, "step": 15508 }, { "epoch": 0.47, "learning_rate": 2.8854356405380587e-06, "loss": 1.2193, "step": 15509 }, { "epoch": 0.47, "learning_rate": 2.8851946350435854e-06, "loss": 1.09, "step": 15510 }, { "epoch": 0.47, "learning_rate": 2.8849536258822442e-06, "loss": 1.1592, "step": 15511 }, { "epoch": 0.47, "learning_rate": 2.8847126130563307e-06, "loss": 1.1537, "step": 15512 }, { "epoch": 0.47, "learning_rate": 2.884471596568138e-06, "loss": 1.0901, "step": 15513 }, { "epoch": 0.47, "learning_rate": 2.88423057641996e-06, "loss": 1.0948, "step": 15514 }, { "epoch": 0.47, "learning_rate": 2.8839895526140926e-06, "loss": 1.1092, "step": 15515 }, { "epoch": 0.47, "learning_rate": 2.8837485251528303e-06, "loss": 1.1887, "step": 15516 }, { "epoch": 0.47, "learning_rate": 2.883507494038466e-06, "loss": 1.0682, "step": 15517 }, { "epoch": 0.47, "learning_rate": 2.883266459273296e-06, "loss": 1.1047, "step": 15518 }, { "epoch": 0.47, "learning_rate": 2.883025420859613e-06, "loss": 1.1804, "step": 15519 }, { "epoch": 0.47, "learning_rate": 2.8827843787997135e-06, "loss": 1.1248, "step": 15520 }, { "epoch": 0.47, "learning_rate": 2.8825433330958895e-06, "loss": 1.1284, "step": 15521 }, { "epoch": 0.47, "learning_rate": 2.8823022837504384e-06, "loss": 1.0198, "step": 15522 }, { "epoch": 0.47, "learning_rate": 2.882061230765653e-06, "loss": 1.219, "step": 15523 }, { "epoch": 0.47, "learning_rate": 2.881820174143829e-06, "loss": 1.223, "step": 15524 }, { "epoch": 0.47, "learning_rate": 2.881579113887261e-06, "loss": 1.2468, "step": 15525 }, { "epoch": 0.47, "learning_rate": 2.8813380499982437e-06, "loss": 1.0466, "step": 15526 }, { "epoch": 0.47, "learning_rate": 2.8810969824790718e-06, "loss": 1.1426, "step": 15527 }, { "epoch": 0.47, "learning_rate": 2.88085591133204e-06, "loss": 1.1066, "step": 15528 }, { "epoch": 0.47, "learning_rate": 2.880614836559443e-06, "loss": 1.1606, "step": 15529 }, { "epoch": 0.47, "learning_rate": 2.880373758163576e-06, "loss": 1.1298, "step": 15530 }, { "epoch": 0.47, "learning_rate": 2.8801326761467346e-06, "loss": 1.0627, "step": 15531 }, { "epoch": 0.47, "learning_rate": 2.879891590511213e-06, "loss": 1.093, "step": 15532 }, { "epoch": 0.47, "learning_rate": 2.879650501259307e-06, "loss": 1.1445, "step": 15533 }, { "epoch": 0.47, "learning_rate": 2.87940940839331e-06, "loss": 1.0542, "step": 15534 }, { "epoch": 0.47, "learning_rate": 2.8791683119155183e-06, "loss": 1.082, "step": 15535 }, { "epoch": 0.47, "learning_rate": 2.8789272118282273e-06, "loss": 1.1683, "step": 15536 }, { "epoch": 0.47, "learning_rate": 2.8786861081337313e-06, "loss": 1.2582, "step": 15537 }, { "epoch": 0.47, "learning_rate": 2.8784450008343266e-06, "loss": 1.0462, "step": 15538 }, { "epoch": 0.47, "learning_rate": 2.878203889932308e-06, "loss": 1.1447, "step": 15539 }, { "epoch": 0.47, "learning_rate": 2.87796277542997e-06, "loss": 1.0589, "step": 15540 }, { "epoch": 0.47, "learning_rate": 2.877721657329608e-06, "loss": 1.0918, "step": 15541 }, { "epoch": 0.47, "learning_rate": 2.8774805356335177e-06, "loss": 1.2114, "step": 15542 }, { "epoch": 0.47, "learning_rate": 2.877239410343995e-06, "loss": 1.081, "step": 15543 }, { "epoch": 0.47, "learning_rate": 2.8769982814633352e-06, "loss": 1.0557, "step": 15544 }, { "epoch": 0.47, "learning_rate": 2.8767571489938324e-06, "loss": 1.1317, "step": 15545 }, { "epoch": 0.47, "learning_rate": 2.876516012937784e-06, "loss": 1.1727, "step": 15546 }, { "epoch": 0.47, "learning_rate": 2.8762748732974836e-06, "loss": 1.0241, "step": 15547 }, { "epoch": 0.47, "learning_rate": 2.8760337300752278e-06, "loss": 1.1697, "step": 15548 }, { "epoch": 0.47, "learning_rate": 2.8757925832733125e-06, "loss": 1.2377, "step": 15549 }, { "epoch": 0.47, "learning_rate": 2.875551432894032e-06, "loss": 1.2383, "step": 15550 }, { "epoch": 0.47, "learning_rate": 2.8753102789396836e-06, "loss": 1.0278, "step": 15551 }, { "epoch": 0.47, "learning_rate": 2.8750691214125613e-06, "loss": 1.1058, "step": 15552 }, { "epoch": 0.47, "learning_rate": 2.8748279603149626e-06, "loss": 1.0067, "step": 15553 }, { "epoch": 0.47, "learning_rate": 2.8745867956491813e-06, "loss": 1.1114, "step": 15554 }, { "epoch": 0.47, "learning_rate": 2.874345627417514e-06, "loss": 1.1281, "step": 15555 }, { "epoch": 0.47, "learning_rate": 2.874104455622257e-06, "loss": 1.0629, "step": 15556 }, { "epoch": 0.47, "learning_rate": 2.873863280265706e-06, "loss": 1.1688, "step": 15557 }, { "epoch": 0.47, "learning_rate": 2.8736221013501566e-06, "loss": 1.1263, "step": 15558 }, { "epoch": 0.47, "learning_rate": 2.873380918877905e-06, "loss": 1.2072, "step": 15559 }, { "epoch": 0.47, "learning_rate": 2.8731397328512463e-06, "loss": 1.2432, "step": 15560 }, { "epoch": 0.47, "learning_rate": 2.8728985432724765e-06, "loss": 1.1444, "step": 15561 }, { "epoch": 0.47, "learning_rate": 2.8726573501438937e-06, "loss": 1.2194, "step": 15562 }, { "epoch": 0.47, "learning_rate": 2.872416153467791e-06, "loss": 1.0408, "step": 15563 }, { "epoch": 0.47, "learning_rate": 2.872174953246467e-06, "loss": 1.247, "step": 15564 }, { "epoch": 0.47, "learning_rate": 2.8719337494822158e-06, "loss": 1.0413, "step": 15565 }, { "epoch": 0.47, "learning_rate": 2.871692542177335e-06, "loss": 1.2166, "step": 15566 }, { "epoch": 0.47, "learning_rate": 2.8714513313341203e-06, "loss": 1.0969, "step": 15567 }, { "epoch": 0.47, "learning_rate": 2.871210116954868e-06, "loss": 1.2177, "step": 15568 }, { "epoch": 0.47, "learning_rate": 2.870968899041873e-06, "loss": 1.1101, "step": 15569 }, { "epoch": 0.47, "learning_rate": 2.8707276775974337e-06, "loss": 1.0975, "step": 15570 }, { "epoch": 0.47, "learning_rate": 2.8704864526238447e-06, "loss": 1.1304, "step": 15571 }, { "epoch": 0.47, "learning_rate": 2.8702452241234036e-06, "loss": 1.1483, "step": 15572 }, { "epoch": 0.47, "learning_rate": 2.8700039920984063e-06, "loss": 1.105, "step": 15573 }, { "epoch": 0.47, "learning_rate": 2.8697627565511487e-06, "loss": 1.1235, "step": 15574 }, { "epoch": 0.47, "learning_rate": 2.869521517483929e-06, "loss": 1.2334, "step": 15575 }, { "epoch": 0.47, "learning_rate": 2.869280274899041e-06, "loss": 1.0373, "step": 15576 }, { "epoch": 0.47, "learning_rate": 2.8690390287987835e-06, "loss": 1.1134, "step": 15577 }, { "epoch": 0.47, "learning_rate": 2.868797779185452e-06, "loss": 1.0865, "step": 15578 }, { "epoch": 0.47, "learning_rate": 2.8685565260613434e-06, "loss": 1.1311, "step": 15579 }, { "epoch": 0.47, "learning_rate": 2.868315269428754e-06, "loss": 1.0549, "step": 15580 }, { "epoch": 0.47, "learning_rate": 2.8680740092899806e-06, "loss": 1.2762, "step": 15581 }, { "epoch": 0.47, "learning_rate": 2.86783274564732e-06, "loss": 1.1279, "step": 15582 }, { "epoch": 0.47, "learning_rate": 2.867591478503068e-06, "loss": 0.9926, "step": 15583 }, { "epoch": 0.47, "learning_rate": 2.8673502078595235e-06, "loss": 1.0461, "step": 15584 }, { "epoch": 0.47, "learning_rate": 2.867108933718981e-06, "loss": 1.1714, "step": 15585 }, { "epoch": 0.47, "learning_rate": 2.866867656083739e-06, "loss": 1.0934, "step": 15586 }, { "epoch": 0.47, "learning_rate": 2.866626374956093e-06, "loss": 1.2943, "step": 15587 }, { "epoch": 0.47, "learning_rate": 2.8663850903383407e-06, "loss": 1.0835, "step": 15588 }, { "epoch": 0.47, "learning_rate": 2.8661438022327785e-06, "loss": 1.1624, "step": 15589 }, { "epoch": 0.47, "learning_rate": 2.8659025106417045e-06, "loss": 0.9821, "step": 15590 }, { "epoch": 0.47, "learning_rate": 2.865661215567414e-06, "loss": 1.0766, "step": 15591 }, { "epoch": 0.47, "learning_rate": 2.8654199170122056e-06, "loss": 1.0657, "step": 15592 }, { "epoch": 0.47, "learning_rate": 2.8651786149783746e-06, "loss": 1.1094, "step": 15593 }, { "epoch": 0.47, "learning_rate": 2.86493730946822e-06, "loss": 1.0826, "step": 15594 }, { "epoch": 0.47, "learning_rate": 2.8646960004840367e-06, "loss": 1.1003, "step": 15595 }, { "epoch": 0.47, "learning_rate": 2.8644546880281243e-06, "loss": 1.0663, "step": 15596 }, { "epoch": 0.47, "learning_rate": 2.864213372102778e-06, "loss": 0.964, "step": 15597 }, { "epoch": 0.47, "learning_rate": 2.8639720527102967e-06, "loss": 1.2181, "step": 15598 }, { "epoch": 0.47, "learning_rate": 2.863730729852976e-06, "loss": 1.1063, "step": 15599 }, { "epoch": 0.47, "learning_rate": 2.8634894035331145e-06, "loss": 1.2817, "step": 15600 }, { "epoch": 0.47, "learning_rate": 2.8632480737530082e-06, "loss": 1.1011, "step": 15601 }, { "epoch": 0.47, "learning_rate": 2.863006740514955e-06, "loss": 1.1407, "step": 15602 }, { "epoch": 0.47, "learning_rate": 2.862765403821254e-06, "loss": 1.1599, "step": 15603 }, { "epoch": 0.47, "learning_rate": 2.8625240636742004e-06, "loss": 1.0958, "step": 15604 }, { "epoch": 0.47, "learning_rate": 2.8622827200760916e-06, "loss": 1.1354, "step": 15605 }, { "epoch": 0.47, "learning_rate": 2.8620413730292264e-06, "loss": 1.2686, "step": 15606 }, { "epoch": 0.47, "learning_rate": 2.8618000225359022e-06, "loss": 1.1317, "step": 15607 }, { "epoch": 0.47, "learning_rate": 2.8615586685984146e-06, "loss": 1.2047, "step": 15608 }, { "epoch": 0.47, "learning_rate": 2.861317311219064e-06, "loss": 1.0989, "step": 15609 }, { "epoch": 0.47, "learning_rate": 2.861075950400146e-06, "loss": 1.1967, "step": 15610 }, { "epoch": 0.47, "learning_rate": 2.8608345861439584e-06, "loss": 1.1412, "step": 15611 }, { "epoch": 0.47, "learning_rate": 2.8605932184527996e-06, "loss": 1.1491, "step": 15612 }, { "epoch": 0.47, "learning_rate": 2.8603518473289678e-06, "loss": 1.2304, "step": 15613 }, { "epoch": 0.47, "learning_rate": 2.860110472774759e-06, "loss": 1.0798, "step": 15614 }, { "epoch": 0.47, "learning_rate": 2.8598690947924716e-06, "loss": 1.1926, "step": 15615 }, { "epoch": 0.47, "learning_rate": 2.8596277133844053e-06, "loss": 1.1512, "step": 15616 }, { "epoch": 0.47, "learning_rate": 2.859386328552855e-06, "loss": 1.2949, "step": 15617 }, { "epoch": 0.47, "learning_rate": 2.859144940300121e-06, "loss": 1.2212, "step": 15618 }, { "epoch": 0.47, "learning_rate": 2.8589035486284993e-06, "loss": 1.173, "step": 15619 }, { "epoch": 0.47, "learning_rate": 2.8586621535402894e-06, "loss": 1.1373, "step": 15620 }, { "epoch": 0.47, "learning_rate": 2.858420755037788e-06, "loss": 0.9487, "step": 15621 }, { "epoch": 0.47, "learning_rate": 2.8581793531232937e-06, "loss": 1.0055, "step": 15622 }, { "epoch": 0.47, "learning_rate": 2.8579379477991043e-06, "loss": 1.1744, "step": 15623 }, { "epoch": 0.47, "learning_rate": 2.8576965390675183e-06, "loss": 1.162, "step": 15624 }, { "epoch": 0.47, "learning_rate": 2.857455126930833e-06, "loss": 1.1237, "step": 15625 }, { "epoch": 0.47, "learning_rate": 2.8572137113913477e-06, "loss": 1.0577, "step": 15626 }, { "epoch": 0.47, "learning_rate": 2.85697229245136e-06, "loss": 1.1014, "step": 15627 }, { "epoch": 0.47, "learning_rate": 2.8567308701131675e-06, "loss": 1.074, "step": 15628 }, { "epoch": 0.47, "learning_rate": 2.856489444379069e-06, "loss": 1.1333, "step": 15629 }, { "epoch": 0.47, "learning_rate": 2.8562480152513626e-06, "loss": 1.1923, "step": 15630 }, { "epoch": 0.47, "learning_rate": 2.8560065827323474e-06, "loss": 1.2382, "step": 15631 }, { "epoch": 0.47, "learning_rate": 2.8557651468243204e-06, "loss": 1.0582, "step": 15632 }, { "epoch": 0.47, "learning_rate": 2.8555237075295804e-06, "loss": 1.1489, "step": 15633 }, { "epoch": 0.47, "learning_rate": 2.855282264850426e-06, "loss": 1.1724, "step": 15634 }, { "epoch": 0.47, "learning_rate": 2.8550408187891567e-06, "loss": 1.1995, "step": 15635 }, { "epoch": 0.47, "learning_rate": 2.854799369348068e-06, "loss": 1.1514, "step": 15636 }, { "epoch": 0.47, "learning_rate": 2.854557916529461e-06, "loss": 1.1815, "step": 15637 }, { "epoch": 0.47, "learning_rate": 2.8543164603356333e-06, "loss": 1.0981, "step": 15638 }, { "epoch": 0.47, "learning_rate": 2.854075000768884e-06, "loss": 1.1769, "step": 15639 }, { "epoch": 0.47, "learning_rate": 2.8538335378315103e-06, "loss": 1.0524, "step": 15640 }, { "epoch": 0.47, "learning_rate": 2.853592071525812e-06, "loss": 1.1013, "step": 15641 }, { "epoch": 0.47, "learning_rate": 2.853350601854088e-06, "loss": 1.1372, "step": 15642 }, { "epoch": 0.47, "learning_rate": 2.8531091288186365e-06, "loss": 1.1807, "step": 15643 }, { "epoch": 0.47, "learning_rate": 2.8528676524217557e-06, "loss": 1.1328, "step": 15644 }, { "epoch": 0.47, "learning_rate": 2.852626172665745e-06, "loss": 1.1471, "step": 15645 }, { "epoch": 0.47, "learning_rate": 2.8523846895529027e-06, "loss": 1.153, "step": 15646 }, { "epoch": 0.47, "learning_rate": 2.852143203085528e-06, "loss": 1.174, "step": 15647 }, { "epoch": 0.47, "learning_rate": 2.8519017132659204e-06, "loss": 1.0992, "step": 15648 }, { "epoch": 0.47, "learning_rate": 2.8516602200963765e-06, "loss": 1.0385, "step": 15649 }, { "epoch": 0.47, "learning_rate": 2.851418723579198e-06, "loss": 1.1651, "step": 15650 }, { "epoch": 0.47, "learning_rate": 2.8511772237166818e-06, "loss": 1.038, "step": 15651 }, { "epoch": 0.47, "learning_rate": 2.8509357205111277e-06, "loss": 1.0757, "step": 15652 }, { "epoch": 0.47, "learning_rate": 2.8506942139648342e-06, "loss": 1.0245, "step": 15653 }, { "epoch": 0.47, "learning_rate": 2.8504527040801005e-06, "loss": 1.1276, "step": 15654 }, { "epoch": 0.47, "learning_rate": 2.850211190859227e-06, "loss": 1.1207, "step": 15655 }, { "epoch": 0.47, "learning_rate": 2.8499696743045106e-06, "loss": 1.1945, "step": 15656 }, { "epoch": 0.47, "learning_rate": 2.849728154418252e-06, "loss": 1.2106, "step": 15657 }, { "epoch": 0.47, "learning_rate": 2.8494866312027495e-06, "loss": 1.1016, "step": 15658 }, { "epoch": 0.47, "learning_rate": 2.849245104660303e-06, "loss": 1.1637, "step": 15659 }, { "epoch": 0.47, "learning_rate": 2.849003574793211e-06, "loss": 1.1389, "step": 15660 }, { "epoch": 0.47, "learning_rate": 2.8487620416037735e-06, "loss": 1.0972, "step": 15661 }, { "epoch": 0.47, "learning_rate": 2.848520505094289e-06, "loss": 1.1602, "step": 15662 }, { "epoch": 0.47, "learning_rate": 2.8482789652670574e-06, "loss": 1.2797, "step": 15663 }, { "epoch": 0.47, "learning_rate": 2.848037422124377e-06, "loss": 1.1127, "step": 15664 }, { "epoch": 0.47, "learning_rate": 2.847795875668548e-06, "loss": 1.1205, "step": 15665 }, { "epoch": 0.47, "learning_rate": 2.84755432590187e-06, "loss": 1.1664, "step": 15666 }, { "epoch": 0.47, "learning_rate": 2.8473127728266427e-06, "loss": 1.2198, "step": 15667 }, { "epoch": 0.47, "learning_rate": 2.8470712164451645e-06, "loss": 1.183, "step": 15668 }, { "epoch": 0.47, "learning_rate": 2.846829656759736e-06, "loss": 1.2456, "step": 15669 }, { "epoch": 0.47, "learning_rate": 2.8465880937726566e-06, "loss": 1.0652, "step": 15670 }, { "epoch": 0.47, "learning_rate": 2.846346527486224e-06, "loss": 1.1077, "step": 15671 }, { "epoch": 0.47, "learning_rate": 2.8461049579027404e-06, "loss": 1.0833, "step": 15672 }, { "epoch": 0.47, "learning_rate": 2.8458633850245036e-06, "loss": 1.1633, "step": 15673 }, { "epoch": 0.47, "learning_rate": 2.845621808853815e-06, "loss": 1.2062, "step": 15674 }, { "epoch": 0.47, "learning_rate": 2.845380229392972e-06, "loss": 1.1697, "step": 15675 }, { "epoch": 0.47, "learning_rate": 2.8451386466442773e-06, "loss": 1.1102, "step": 15676 }, { "epoch": 0.47, "learning_rate": 2.8448970606100268e-06, "loss": 1.1168, "step": 15677 }, { "epoch": 0.47, "learning_rate": 2.8446554712925232e-06, "loss": 1.0455, "step": 15678 }, { "epoch": 0.47, "learning_rate": 2.8444138786940655e-06, "loss": 1.1006, "step": 15679 }, { "epoch": 0.47, "learning_rate": 2.8441722828169542e-06, "loss": 1.194, "step": 15680 }, { "epoch": 0.47, "learning_rate": 2.8439306836634877e-06, "loss": 1.1567, "step": 15681 }, { "epoch": 0.47, "learning_rate": 2.843689081235967e-06, "loss": 1.1198, "step": 15682 }, { "epoch": 0.47, "learning_rate": 2.843447475536692e-06, "loss": 1.1751, "step": 15683 }, { "epoch": 0.47, "learning_rate": 2.843205866567962e-06, "loss": 1.1116, "step": 15684 }, { "epoch": 0.47, "learning_rate": 2.842964254332078e-06, "loss": 1.0313, "step": 15685 }, { "epoch": 0.47, "learning_rate": 2.8427226388313388e-06, "loss": 1.1708, "step": 15686 }, { "epoch": 0.47, "learning_rate": 2.8424810200680465e-06, "loss": 1.1591, "step": 15687 }, { "epoch": 0.47, "learning_rate": 2.8422393980444985e-06, "loss": 1.1716, "step": 15688 }, { "epoch": 0.47, "learning_rate": 2.8419977727629967e-06, "loss": 1.1936, "step": 15689 }, { "epoch": 0.47, "learning_rate": 2.8417561442258408e-06, "loss": 1.0726, "step": 15690 }, { "epoch": 0.47, "learning_rate": 2.8415145124353313e-06, "loss": 1.1803, "step": 15691 }, { "epoch": 0.47, "learning_rate": 2.841272877393767e-06, "loss": 1.1077, "step": 15692 }, { "epoch": 0.47, "learning_rate": 2.84103123910345e-06, "loss": 1.1981, "step": 15693 }, { "epoch": 0.47, "learning_rate": 2.8407895975666793e-06, "loss": 1.0876, "step": 15694 }, { "epoch": 0.47, "learning_rate": 2.8405479527857565e-06, "loss": 1.1046, "step": 15695 }, { "epoch": 0.47, "learning_rate": 2.8403063047629816e-06, "loss": 1.0863, "step": 15696 }, { "epoch": 0.47, "learning_rate": 2.8400646535006538e-06, "loss": 1.1383, "step": 15697 }, { "epoch": 0.47, "learning_rate": 2.8398229990010745e-06, "loss": 1.1161, "step": 15698 }, { "epoch": 0.47, "learning_rate": 2.8395813412665433e-06, "loss": 1.2491, "step": 15699 }, { "epoch": 0.47, "learning_rate": 2.8393396802993626e-06, "loss": 1.2007, "step": 15700 }, { "epoch": 0.47, "learning_rate": 2.8390980161018304e-06, "loss": 1.1821, "step": 15701 }, { "epoch": 0.47, "learning_rate": 2.838856348676249e-06, "loss": 1.0787, "step": 15702 }, { "epoch": 0.47, "learning_rate": 2.8386146780249183e-06, "loss": 1.1014, "step": 15703 }, { "epoch": 0.47, "learning_rate": 2.8383730041501397e-06, "loss": 1.3087, "step": 15704 }, { "epoch": 0.47, "learning_rate": 2.8381313270542116e-06, "loss": 1.2269, "step": 15705 }, { "epoch": 0.47, "learning_rate": 2.8378896467394368e-06, "loss": 1.2182, "step": 15706 }, { "epoch": 0.47, "learning_rate": 2.837647963208115e-06, "loss": 1.015, "step": 15707 }, { "epoch": 0.47, "learning_rate": 2.837406276462547e-06, "loss": 1.1423, "step": 15708 }, { "epoch": 0.47, "learning_rate": 2.8371645865050347e-06, "loss": 1.0801, "step": 15709 }, { "epoch": 0.47, "learning_rate": 2.8369228933378766e-06, "loss": 1.0839, "step": 15710 }, { "epoch": 0.47, "learning_rate": 2.836681196963376e-06, "loss": 1.1504, "step": 15711 }, { "epoch": 0.47, "learning_rate": 2.8364394973838322e-06, "loss": 1.0372, "step": 15712 }, { "epoch": 0.47, "learning_rate": 2.8361977946015466e-06, "loss": 1.1924, "step": 15713 }, { "epoch": 0.47, "learning_rate": 2.83595608861882e-06, "loss": 1.1296, "step": 15714 }, { "epoch": 0.47, "learning_rate": 2.8357143794379533e-06, "loss": 1.1696, "step": 15715 }, { "epoch": 0.47, "learning_rate": 2.8354726670612463e-06, "loss": 1.1274, "step": 15716 }, { "epoch": 0.47, "learning_rate": 2.8352309514910027e-06, "loss": 1.1025, "step": 15717 }, { "epoch": 0.47, "learning_rate": 2.834989232729521e-06, "loss": 1.1508, "step": 15718 }, { "epoch": 0.47, "learning_rate": 2.834747510779103e-06, "loss": 1.1436, "step": 15719 }, { "epoch": 0.47, "learning_rate": 2.8345057856420495e-06, "loss": 1.0414, "step": 15720 }, { "epoch": 0.47, "learning_rate": 2.834264057320663e-06, "loss": 1.0894, "step": 15721 }, { "epoch": 0.47, "learning_rate": 2.8340223258172427e-06, "loss": 0.9772, "step": 15722 }, { "epoch": 0.47, "learning_rate": 2.8337805911340915e-06, "loss": 1.1258, "step": 15723 }, { "epoch": 0.47, "learning_rate": 2.8335388532735098e-06, "loss": 1.1698, "step": 15724 }, { "epoch": 0.47, "learning_rate": 2.8332971122377983e-06, "loss": 1.1793, "step": 15725 }, { "epoch": 0.47, "learning_rate": 2.83305536802926e-06, "loss": 1.1547, "step": 15726 }, { "epoch": 0.47, "learning_rate": 2.832813620650194e-06, "loss": 1.1132, "step": 15727 }, { "epoch": 0.47, "learning_rate": 2.832571870102903e-06, "loss": 1.1866, "step": 15728 }, { "epoch": 0.47, "learning_rate": 2.8323301163896876e-06, "loss": 1.094, "step": 15729 }, { "epoch": 0.47, "learning_rate": 2.8320883595128503e-06, "loss": 1.1392, "step": 15730 }, { "epoch": 0.47, "learning_rate": 2.8318465994746907e-06, "loss": 1.1655, "step": 15731 }, { "epoch": 0.47, "learning_rate": 2.8316048362775124e-06, "loss": 1.0966, "step": 15732 }, { "epoch": 0.47, "learning_rate": 2.831363069923615e-06, "loss": 1.0826, "step": 15733 }, { "epoch": 0.47, "learning_rate": 2.8311213004153003e-06, "loss": 0.9972, "step": 15734 }, { "epoch": 0.47, "learning_rate": 2.8308795277548705e-06, "loss": 1.1285, "step": 15735 }, { "epoch": 0.47, "learning_rate": 2.8306377519446275e-06, "loss": 1.2134, "step": 15736 }, { "epoch": 0.47, "learning_rate": 2.8303959729868724e-06, "loss": 1.0726, "step": 15737 }, { "epoch": 0.47, "learning_rate": 2.8301541908839065e-06, "loss": 1.1449, "step": 15738 }, { "epoch": 0.47, "learning_rate": 2.8299124056380324e-06, "loss": 1.1572, "step": 15739 }, { "epoch": 0.47, "learning_rate": 2.82967061725155e-06, "loss": 1.0914, "step": 15740 }, { "epoch": 0.47, "learning_rate": 2.8294288257267626e-06, "loss": 1.1031, "step": 15741 }, { "epoch": 0.47, "learning_rate": 2.829187031065971e-06, "loss": 1.1276, "step": 15742 }, { "epoch": 0.47, "learning_rate": 2.8289452332714785e-06, "loss": 1.1263, "step": 15743 }, { "epoch": 0.47, "learning_rate": 2.8287034323455847e-06, "loss": 1.064, "step": 15744 }, { "epoch": 0.47, "learning_rate": 2.8284616282905935e-06, "loss": 1.0815, "step": 15745 }, { "epoch": 0.47, "learning_rate": 2.8282198211088053e-06, "loss": 1.0972, "step": 15746 }, { "epoch": 0.47, "learning_rate": 2.8279780108025217e-06, "loss": 1.1523, "step": 15747 }, { "epoch": 0.47, "learning_rate": 2.8277361973740463e-06, "loss": 1.0793, "step": 15748 }, { "epoch": 0.47, "learning_rate": 2.8274943808256792e-06, "loss": 1.1396, "step": 15749 }, { "epoch": 0.47, "learning_rate": 2.8272525611597248e-06, "loss": 1.0883, "step": 15750 }, { "epoch": 0.47, "learning_rate": 2.8270107383784827e-06, "loss": 1.0867, "step": 15751 }, { "epoch": 0.47, "learning_rate": 2.826768912484256e-06, "loss": 1.166, "step": 15752 }, { "epoch": 0.47, "learning_rate": 2.8265270834793466e-06, "loss": 1.0722, "step": 15753 }, { "epoch": 0.47, "learning_rate": 2.8262852513660575e-06, "loss": 1.1102, "step": 15754 }, { "epoch": 0.47, "learning_rate": 2.826043416146689e-06, "loss": 1.1786, "step": 15755 }, { "epoch": 0.47, "learning_rate": 2.825801577823545e-06, "loss": 1.1751, "step": 15756 }, { "epoch": 0.47, "learning_rate": 2.8255597363989256e-06, "loss": 1.0936, "step": 15757 }, { "epoch": 0.47, "learning_rate": 2.8253178918751355e-06, "loss": 1.1324, "step": 15758 }, { "epoch": 0.47, "learning_rate": 2.825076044254475e-06, "loss": 1.1893, "step": 15759 }, { "epoch": 0.47, "learning_rate": 2.824834193539247e-06, "loss": 1.058, "step": 15760 }, { "epoch": 0.47, "learning_rate": 2.824592339731754e-06, "loss": 1.2367, "step": 15761 }, { "epoch": 0.47, "learning_rate": 2.8243504828342984e-06, "loss": 1.1476, "step": 15762 }, { "epoch": 0.47, "learning_rate": 2.824108622849183e-06, "loss": 1.0305, "step": 15763 }, { "epoch": 0.47, "learning_rate": 2.823866759778709e-06, "loss": 1.1476, "step": 15764 }, { "epoch": 0.47, "learning_rate": 2.8236248936251797e-06, "loss": 1.1052, "step": 15765 }, { "epoch": 0.47, "learning_rate": 2.823383024390897e-06, "loss": 1.1506, "step": 15766 }, { "epoch": 0.47, "learning_rate": 2.823141152078164e-06, "loss": 1.2333, "step": 15767 }, { "epoch": 0.48, "learning_rate": 2.822899276689283e-06, "loss": 1.2029, "step": 15768 }, { "epoch": 0.48, "learning_rate": 2.822657398226556e-06, "loss": 1.1074, "step": 15769 }, { "epoch": 0.48, "learning_rate": 2.8224155166922858e-06, "loss": 1.2382, "step": 15770 }, { "epoch": 0.48, "learning_rate": 2.822173632088776e-06, "loss": 1.0911, "step": 15771 }, { "epoch": 0.48, "learning_rate": 2.8219317444183275e-06, "loss": 1.1519, "step": 15772 }, { "epoch": 0.48, "learning_rate": 2.821689853683244e-06, "loss": 1.0919, "step": 15773 }, { "epoch": 0.48, "learning_rate": 2.821447959885828e-06, "loss": 1.186, "step": 15774 }, { "epoch": 0.48, "learning_rate": 2.8212060630283822e-06, "loss": 1.0684, "step": 15775 }, { "epoch": 0.48, "learning_rate": 2.8209641631132096e-06, "loss": 1.2028, "step": 15776 }, { "epoch": 0.48, "learning_rate": 2.8207222601426126e-06, "loss": 1.1364, "step": 15777 }, { "epoch": 0.48, "learning_rate": 2.8204803541188947e-06, "loss": 1.1792, "step": 15778 }, { "epoch": 0.48, "learning_rate": 2.820238445044357e-06, "loss": 1.2966, "step": 15779 }, { "epoch": 0.48, "learning_rate": 2.819996532921305e-06, "loss": 1.0896, "step": 15780 }, { "epoch": 0.48, "learning_rate": 2.819754617752039e-06, "loss": 1.098, "step": 15781 }, { "epoch": 0.48, "learning_rate": 2.819512699538864e-06, "loss": 1.0439, "step": 15782 }, { "epoch": 0.48, "learning_rate": 2.8192707782840812e-06, "loss": 1.1871, "step": 15783 }, { "epoch": 0.48, "learning_rate": 2.8190288539899947e-06, "loss": 1.1107, "step": 15784 }, { "epoch": 0.48, "learning_rate": 2.8187869266589067e-06, "loss": 1.1133, "step": 15785 }, { "epoch": 0.48, "learning_rate": 2.8185449962931216e-06, "loss": 1.1372, "step": 15786 }, { "epoch": 0.48, "learning_rate": 2.8183030628949408e-06, "loss": 1.2356, "step": 15787 }, { "epoch": 0.48, "learning_rate": 2.818061126466668e-06, "loss": 1.1266, "step": 15788 }, { "epoch": 0.48, "learning_rate": 2.8178191870106063e-06, "loss": 1.1439, "step": 15789 }, { "epoch": 0.48, "learning_rate": 2.8175772445290593e-06, "loss": 1.0853, "step": 15790 }, { "epoch": 0.48, "learning_rate": 2.817335299024331e-06, "loss": 1.0125, "step": 15791 }, { "epoch": 0.48, "learning_rate": 2.817093350498722e-06, "loss": 1.3207, "step": 15792 }, { "epoch": 0.48, "learning_rate": 2.8168513989545377e-06, "loss": 1.1824, "step": 15793 }, { "epoch": 0.48, "learning_rate": 2.8166094443940806e-06, "loss": 1.0826, "step": 15794 }, { "epoch": 0.48, "learning_rate": 2.8163674868196546e-06, "loss": 1.1281, "step": 15795 }, { "epoch": 0.48, "learning_rate": 2.8161255262335614e-06, "loss": 1.1685, "step": 15796 }, { "epoch": 0.48, "learning_rate": 2.8158835626381066e-06, "loss": 1.1527, "step": 15797 }, { "epoch": 0.48, "learning_rate": 2.8156415960355914e-06, "loss": 1.0707, "step": 15798 }, { "epoch": 0.48, "learning_rate": 2.8153996264283207e-06, "loss": 1.0466, "step": 15799 }, { "epoch": 0.48, "learning_rate": 2.815157653818597e-06, "loss": 1.1263, "step": 15800 }, { "epoch": 0.48, "learning_rate": 2.8149156782087244e-06, "loss": 1.2389, "step": 15801 }, { "epoch": 0.48, "learning_rate": 2.8146736996010066e-06, "loss": 1.033, "step": 15802 }, { "epoch": 0.48, "learning_rate": 2.814431717997746e-06, "loss": 1.0972, "step": 15803 }, { "epoch": 0.48, "learning_rate": 2.814189733401248e-06, "loss": 1.1805, "step": 15804 }, { "epoch": 0.48, "learning_rate": 2.813947745813814e-06, "loss": 1.196, "step": 15805 }, { "epoch": 0.48, "learning_rate": 2.8137057552377495e-06, "loss": 1.0582, "step": 15806 }, { "epoch": 0.48, "learning_rate": 2.8134637616753567e-06, "loss": 1.1791, "step": 15807 }, { "epoch": 0.48, "learning_rate": 2.8132217651289405e-06, "loss": 1.145, "step": 15808 }, { "epoch": 0.48, "learning_rate": 2.8129797656008036e-06, "loss": 1.1486, "step": 15809 }, { "epoch": 0.48, "learning_rate": 2.81273776309325e-06, "loss": 1.1284, "step": 15810 }, { "epoch": 0.48, "learning_rate": 2.8124957576085834e-06, "loss": 1.082, "step": 15811 }, { "epoch": 0.48, "learning_rate": 2.8122537491491083e-06, "loss": 1.0887, "step": 15812 }, { "epoch": 0.48, "learning_rate": 2.812011737717127e-06, "loss": 1.1171, "step": 15813 }, { "epoch": 0.48, "learning_rate": 2.8117697233149445e-06, "loss": 1.1827, "step": 15814 }, { "epoch": 0.48, "learning_rate": 2.811527705944865e-06, "loss": 0.9893, "step": 15815 }, { "epoch": 0.48, "learning_rate": 2.811285685609191e-06, "loss": 1.1826, "step": 15816 }, { "epoch": 0.48, "learning_rate": 2.811043662310227e-06, "loss": 1.2837, "step": 15817 }, { "epoch": 0.48, "learning_rate": 2.8108016360502776e-06, "loss": 1.2025, "step": 15818 }, { "epoch": 0.48, "learning_rate": 2.8105596068316466e-06, "loss": 1.1143, "step": 15819 }, { "epoch": 0.48, "learning_rate": 2.8103175746566373e-06, "loss": 1.1549, "step": 15820 }, { "epoch": 0.48, "learning_rate": 2.810075539527555e-06, "loss": 1.0789, "step": 15821 }, { "epoch": 0.48, "learning_rate": 2.8098335014467015e-06, "loss": 1.1497, "step": 15822 }, { "epoch": 0.48, "learning_rate": 2.8095914604163833e-06, "loss": 1.0611, "step": 15823 }, { "epoch": 0.48, "learning_rate": 2.809349416438903e-06, "loss": 1.1604, "step": 15824 }, { "epoch": 0.48, "learning_rate": 2.809107369516566e-06, "loss": 1.1637, "step": 15825 }, { "epoch": 0.48, "learning_rate": 2.8088653196516745e-06, "loss": 1.0883, "step": 15826 }, { "epoch": 0.48, "learning_rate": 2.8086232668465345e-06, "loss": 1.0762, "step": 15827 }, { "epoch": 0.48, "learning_rate": 2.8083812111034505e-06, "loss": 1.1531, "step": 15828 }, { "epoch": 0.48, "learning_rate": 2.8081391524247248e-06, "loss": 1.2607, "step": 15829 }, { "epoch": 0.48, "learning_rate": 2.8078970908126625e-06, "loss": 1.2229, "step": 15830 }, { "epoch": 0.48, "learning_rate": 2.8076550262695686e-06, "loss": 1.1131, "step": 15831 }, { "epoch": 0.48, "learning_rate": 2.8074129587977473e-06, "loss": 1.0975, "step": 15832 }, { "epoch": 0.48, "learning_rate": 2.8071708883995025e-06, "loss": 1.1271, "step": 15833 }, { "epoch": 0.48, "learning_rate": 2.806928815077139e-06, "loss": 1.2087, "step": 15834 }, { "epoch": 0.48, "learning_rate": 2.806686738832961e-06, "loss": 1.1649, "step": 15835 }, { "epoch": 0.48, "learning_rate": 2.8064446596692727e-06, "loss": 1.121, "step": 15836 }, { "epoch": 0.48, "learning_rate": 2.806202577588379e-06, "loss": 1.0818, "step": 15837 }, { "epoch": 0.48, "learning_rate": 2.8059604925925844e-06, "loss": 1.2614, "step": 15838 }, { "epoch": 0.48, "learning_rate": 2.805718404684193e-06, "loss": 1.1164, "step": 15839 }, { "epoch": 0.48, "learning_rate": 2.8054763138655093e-06, "loss": 1.0414, "step": 15840 }, { "epoch": 0.48, "learning_rate": 2.8052342201388387e-06, "loss": 1.2001, "step": 15841 }, { "epoch": 0.48, "learning_rate": 2.804992123506485e-06, "loss": 1.1055, "step": 15842 }, { "epoch": 0.48, "learning_rate": 2.804750023970753e-06, "loss": 1.2184, "step": 15843 }, { "epoch": 0.48, "learning_rate": 2.804507921533948e-06, "loss": 1.2592, "step": 15844 }, { "epoch": 0.48, "learning_rate": 2.8042658161983743e-06, "loss": 1.17, "step": 15845 }, { "epoch": 0.48, "learning_rate": 2.804023707966336e-06, "loss": 1.0128, "step": 15846 }, { "epoch": 0.48, "learning_rate": 2.8037815968401393e-06, "loss": 0.9963, "step": 15847 }, { "epoch": 0.48, "learning_rate": 2.8035394828220876e-06, "loss": 1.007, "step": 15848 }, { "epoch": 0.48, "learning_rate": 2.803297365914487e-06, "loss": 1.2304, "step": 15849 }, { "epoch": 0.48, "learning_rate": 2.8030552461196404e-06, "loss": 1.0334, "step": 15850 }, { "epoch": 0.48, "learning_rate": 2.8028131234398544e-06, "loss": 1.1462, "step": 15851 }, { "epoch": 0.48, "learning_rate": 2.8025709978774327e-06, "loss": 1.1263, "step": 15852 }, { "epoch": 0.48, "learning_rate": 2.802328869434681e-06, "loss": 1.1093, "step": 15853 }, { "epoch": 0.48, "learning_rate": 2.802086738113905e-06, "loss": 1.1143, "step": 15854 }, { "epoch": 0.48, "learning_rate": 2.8018446039174075e-06, "loss": 1.1556, "step": 15855 }, { "epoch": 0.48, "learning_rate": 2.8016024668474957e-06, "loss": 1.1443, "step": 15856 }, { "epoch": 0.48, "learning_rate": 2.8013603269064733e-06, "loss": 1.1166, "step": 15857 }, { "epoch": 0.48, "learning_rate": 2.8011181840966453e-06, "loss": 1.1925, "step": 15858 }, { "epoch": 0.48, "learning_rate": 2.8008760384203175e-06, "loss": 1.1765, "step": 15859 }, { "epoch": 0.48, "learning_rate": 2.8006338898797953e-06, "loss": 1.1426, "step": 15860 }, { "epoch": 0.48, "learning_rate": 2.8003917384773825e-06, "loss": 1.2002, "step": 15861 }, { "epoch": 0.48, "learning_rate": 2.800149584215385e-06, "loss": 1.1816, "step": 15862 }, { "epoch": 0.48, "learning_rate": 2.7999074270961086e-06, "loss": 1.0948, "step": 15863 }, { "epoch": 0.48, "learning_rate": 2.7996652671218584e-06, "loss": 1.1857, "step": 15864 }, { "epoch": 0.48, "learning_rate": 2.7994231042949375e-06, "loss": 1.1375, "step": 15865 }, { "epoch": 0.48, "learning_rate": 2.7991809386176542e-06, "loss": 1.1251, "step": 15866 }, { "epoch": 0.48, "learning_rate": 2.798938770092312e-06, "loss": 1.083, "step": 15867 }, { "epoch": 0.48, "learning_rate": 2.7986965987212165e-06, "loss": 1.0687, "step": 15868 }, { "epoch": 0.48, "learning_rate": 2.798454424506674e-06, "loss": 1.0422, "step": 15869 }, { "epoch": 0.48, "learning_rate": 2.798212247450988e-06, "loss": 1.124, "step": 15870 }, { "epoch": 0.48, "learning_rate": 2.797970067556466e-06, "loss": 1.0912, "step": 15871 }, { "epoch": 0.48, "learning_rate": 2.797727884825412e-06, "loss": 1.0186, "step": 15872 }, { "epoch": 0.48, "learning_rate": 2.7974856992601317e-06, "loss": 1.2622, "step": 15873 }, { "epoch": 0.48, "learning_rate": 2.7972435108629315e-06, "loss": 1.2587, "step": 15874 }, { "epoch": 0.48, "learning_rate": 2.7970013196361157e-06, "loss": 1.2162, "step": 15875 }, { "epoch": 0.48, "learning_rate": 2.7967591255819903e-06, "loss": 1.1089, "step": 15876 }, { "epoch": 0.48, "learning_rate": 2.7965169287028614e-06, "loss": 1.1506, "step": 15877 }, { "epoch": 0.48, "learning_rate": 2.7962747290010337e-06, "loss": 1.102, "step": 15878 }, { "epoch": 0.48, "learning_rate": 2.796032526478814e-06, "loss": 1.1649, "step": 15879 }, { "epoch": 0.48, "learning_rate": 2.7957903211385067e-06, "loss": 1.2628, "step": 15880 }, { "epoch": 0.48, "learning_rate": 2.795548112982418e-06, "loss": 1.1657, "step": 15881 }, { "epoch": 0.48, "learning_rate": 2.7953059020128535e-06, "loss": 1.1932, "step": 15882 }, { "epoch": 0.48, "learning_rate": 2.7950636882321193e-06, "loss": 1.1118, "step": 15883 }, { "epoch": 0.48, "learning_rate": 2.79482147164252e-06, "loss": 1.1571, "step": 15884 }, { "epoch": 0.48, "learning_rate": 2.7945792522463634e-06, "loss": 1.1457, "step": 15885 }, { "epoch": 0.48, "learning_rate": 2.7943370300459544e-06, "loss": 1.2512, "step": 15886 }, { "epoch": 0.48, "learning_rate": 2.794094805043598e-06, "loss": 1.0766, "step": 15887 }, { "epoch": 0.48, "learning_rate": 2.7938525772416008e-06, "loss": 1.2145, "step": 15888 }, { "epoch": 0.48, "learning_rate": 2.793610346642268e-06, "loss": 1.0289, "step": 15889 }, { "epoch": 0.48, "learning_rate": 2.7933681132479076e-06, "loss": 1.0585, "step": 15890 }, { "epoch": 0.48, "learning_rate": 2.7931258770608226e-06, "loss": 1.1281, "step": 15891 }, { "epoch": 0.48, "learning_rate": 2.7928836380833215e-06, "loss": 1.1946, "step": 15892 }, { "epoch": 0.48, "learning_rate": 2.7926413963177085e-06, "loss": 1.1229, "step": 15893 }, { "epoch": 0.48, "learning_rate": 2.79239915176629e-06, "loss": 1.0831, "step": 15894 }, { "epoch": 0.48, "learning_rate": 2.7921569044313736e-06, "loss": 1.1061, "step": 15895 }, { "epoch": 0.48, "learning_rate": 2.791914654315263e-06, "loss": 1.081, "step": 15896 }, { "epoch": 0.48, "learning_rate": 2.791672401420266e-06, "loss": 1.0427, "step": 15897 }, { "epoch": 0.48, "learning_rate": 2.7914301457486882e-06, "loss": 1.1341, "step": 15898 }, { "epoch": 0.48, "learning_rate": 2.7911878873028353e-06, "loss": 1.001, "step": 15899 }, { "epoch": 0.48, "learning_rate": 2.790945626085014e-06, "loss": 1.1184, "step": 15900 }, { "epoch": 0.48, "learning_rate": 2.7907033620975315e-06, "loss": 1.2368, "step": 15901 }, { "epoch": 0.48, "learning_rate": 2.7904610953426924e-06, "loss": 1.0264, "step": 15902 }, { "epoch": 0.48, "learning_rate": 2.7902188258228035e-06, "loss": 1.1085, "step": 15903 }, { "epoch": 0.48, "learning_rate": 2.7899765535401715e-06, "loss": 1.1982, "step": 15904 }, { "epoch": 0.48, "learning_rate": 2.7897342784971022e-06, "loss": 1.1452, "step": 15905 }, { "epoch": 0.48, "learning_rate": 2.789492000695902e-06, "loss": 1.2686, "step": 15906 }, { "epoch": 0.48, "learning_rate": 2.789249720138877e-06, "loss": 1.0075, "step": 15907 }, { "epoch": 0.48, "learning_rate": 2.7890074368283345e-06, "loss": 1.1171, "step": 15908 }, { "epoch": 0.48, "learning_rate": 2.7887651507665804e-06, "loss": 1.0785, "step": 15909 }, { "epoch": 0.48, "learning_rate": 2.7885228619559206e-06, "loss": 1.1324, "step": 15910 }, { "epoch": 0.48, "learning_rate": 2.7882805703986625e-06, "loss": 1.0767, "step": 15911 }, { "epoch": 0.48, "learning_rate": 2.788038276097112e-06, "loss": 1.2861, "step": 15912 }, { "epoch": 0.48, "learning_rate": 2.787795979053576e-06, "loss": 1.0555, "step": 15913 }, { "epoch": 0.48, "learning_rate": 2.787553679270361e-06, "loss": 1.0328, "step": 15914 }, { "epoch": 0.48, "learning_rate": 2.7873113767497734e-06, "loss": 1.0788, "step": 15915 }, { "epoch": 0.48, "learning_rate": 2.78706907149412e-06, "loss": 1.1522, "step": 15916 }, { "epoch": 0.48, "learning_rate": 2.7868267635057066e-06, "loss": 1.2133, "step": 15917 }, { "epoch": 0.48, "learning_rate": 2.786584452786842e-06, "loss": 1.1829, "step": 15918 }, { "epoch": 0.48, "learning_rate": 2.78634213933983e-06, "loss": 1.231, "step": 15919 }, { "epoch": 0.48, "learning_rate": 2.7860998231669788e-06, "loss": 1.092, "step": 15920 }, { "epoch": 0.48, "learning_rate": 2.785857504270596e-06, "loss": 1.0593, "step": 15921 }, { "epoch": 0.48, "learning_rate": 2.7856151826529865e-06, "loss": 1.0176, "step": 15922 }, { "epoch": 0.48, "learning_rate": 2.785372858316459e-06, "loss": 1.0851, "step": 15923 }, { "epoch": 0.48, "learning_rate": 2.7851305312633185e-06, "loss": 1.1845, "step": 15924 }, { "epoch": 0.48, "learning_rate": 2.7848882014958727e-06, "loss": 1.0592, "step": 15925 }, { "epoch": 0.48, "learning_rate": 2.7846458690164285e-06, "loss": 1.1414, "step": 15926 }, { "epoch": 0.48, "learning_rate": 2.7844035338272932e-06, "loss": 1.1316, "step": 15927 }, { "epoch": 0.48, "learning_rate": 2.784161195930773e-06, "loss": 1.0996, "step": 15928 }, { "epoch": 0.48, "learning_rate": 2.7839188553291753e-06, "loss": 1.1293, "step": 15929 }, { "epoch": 0.48, "learning_rate": 2.7836765120248067e-06, "loss": 1.2014, "step": 15930 }, { "epoch": 0.48, "learning_rate": 2.7834341660199743e-06, "loss": 1.1342, "step": 15931 }, { "epoch": 0.48, "learning_rate": 2.783191817316985e-06, "loss": 0.9939, "step": 15932 }, { "epoch": 0.48, "learning_rate": 2.7829494659181454e-06, "loss": 1.1471, "step": 15933 }, { "epoch": 0.48, "learning_rate": 2.782707111825764e-06, "loss": 1.0997, "step": 15934 }, { "epoch": 0.48, "learning_rate": 2.782464755042147e-06, "loss": 1.114, "step": 15935 }, { "epoch": 0.48, "learning_rate": 2.7822223955696015e-06, "loss": 1.1665, "step": 15936 }, { "epoch": 0.48, "learning_rate": 2.7819800334104346e-06, "loss": 1.1671, "step": 15937 }, { "epoch": 0.48, "learning_rate": 2.781737668566954e-06, "loss": 1.1064, "step": 15938 }, { "epoch": 0.48, "learning_rate": 2.781495301041466e-06, "loss": 1.1514, "step": 15939 }, { "epoch": 0.48, "learning_rate": 2.781252930836278e-06, "loss": 1.1168, "step": 15940 }, { "epoch": 0.48, "learning_rate": 2.781010557953698e-06, "loss": 1.0792, "step": 15941 }, { "epoch": 0.48, "learning_rate": 2.7807681823960325e-06, "loss": 1.1866, "step": 15942 }, { "epoch": 0.48, "learning_rate": 2.7805258041655893e-06, "loss": 1.0875, "step": 15943 }, { "epoch": 0.48, "learning_rate": 2.7802834232646758e-06, "loss": 1.0889, "step": 15944 }, { "epoch": 0.48, "learning_rate": 2.780041039695599e-06, "loss": 1.1226, "step": 15945 }, { "epoch": 0.48, "learning_rate": 2.779798653460667e-06, "loss": 1.1023, "step": 15946 }, { "epoch": 0.48, "learning_rate": 2.7795562645621853e-06, "loss": 1.0813, "step": 15947 }, { "epoch": 0.48, "learning_rate": 2.7793138730024632e-06, "loss": 1.1802, "step": 15948 }, { "epoch": 0.48, "learning_rate": 2.7790714787838073e-06, "loss": 1.1487, "step": 15949 }, { "epoch": 0.48, "learning_rate": 2.7788290819085257e-06, "loss": 1.0972, "step": 15950 }, { "epoch": 0.48, "learning_rate": 2.778586682378926e-06, "loss": 1.0242, "step": 15951 }, { "epoch": 0.48, "learning_rate": 2.7783442801973145e-06, "loss": 1.115, "step": 15952 }, { "epoch": 0.48, "learning_rate": 2.7781018753659994e-06, "loss": 1.0715, "step": 15953 }, { "epoch": 0.48, "learning_rate": 2.7778594678872883e-06, "loss": 1.0953, "step": 15954 }, { "epoch": 0.48, "learning_rate": 2.77761705776349e-06, "loss": 1.0111, "step": 15955 }, { "epoch": 0.48, "learning_rate": 2.7773746449969097e-06, "loss": 1.1254, "step": 15956 }, { "epoch": 0.48, "learning_rate": 2.777132229589857e-06, "loss": 1.0551, "step": 15957 }, { "epoch": 0.48, "learning_rate": 2.7768898115446384e-06, "loss": 1.1159, "step": 15958 }, { "epoch": 0.48, "learning_rate": 2.776647390863563e-06, "loss": 1.2104, "step": 15959 }, { "epoch": 0.48, "learning_rate": 2.776404967548937e-06, "loss": 1.0636, "step": 15960 }, { "epoch": 0.48, "learning_rate": 2.776162541603069e-06, "loss": 1.1579, "step": 15961 }, { "epoch": 0.48, "learning_rate": 2.7759201130282676e-06, "loss": 1.2128, "step": 15962 }, { "epoch": 0.48, "learning_rate": 2.775677681826838e-06, "loss": 1.0276, "step": 15963 }, { "epoch": 0.48, "learning_rate": 2.775435248001091e-06, "loss": 1.109, "step": 15964 }, { "epoch": 0.48, "learning_rate": 2.7751928115533323e-06, "loss": 1.1409, "step": 15965 }, { "epoch": 0.48, "learning_rate": 2.7749503724858705e-06, "loss": 1.1539, "step": 15966 }, { "epoch": 0.48, "learning_rate": 2.7747079308010137e-06, "loss": 1.1566, "step": 15967 }, { "epoch": 0.48, "learning_rate": 2.77446548650107e-06, "loss": 1.1265, "step": 15968 }, { "epoch": 0.48, "learning_rate": 2.774223039588347e-06, "loss": 1.0158, "step": 15969 }, { "epoch": 0.48, "learning_rate": 2.7739805900651526e-06, "loss": 1.041, "step": 15970 }, { "epoch": 0.48, "learning_rate": 2.7737381379337954e-06, "loss": 1.17, "step": 15971 }, { "epoch": 0.48, "learning_rate": 2.7734956831965827e-06, "loss": 1.1996, "step": 15972 }, { "epoch": 0.48, "learning_rate": 2.773253225855822e-06, "loss": 1.177, "step": 15973 }, { "epoch": 0.48, "learning_rate": 2.7730107659138227e-06, "loss": 1.1345, "step": 15974 }, { "epoch": 0.48, "learning_rate": 2.772768303372893e-06, "loss": 1.1562, "step": 15975 }, { "epoch": 0.48, "learning_rate": 2.7725258382353397e-06, "loss": 1.0854, "step": 15976 }, { "epoch": 0.48, "learning_rate": 2.7722833705034723e-06, "loss": 1.2116, "step": 15977 }, { "epoch": 0.48, "learning_rate": 2.7720409001795977e-06, "loss": 1.0856, "step": 15978 }, { "epoch": 0.48, "learning_rate": 2.7717984272660253e-06, "loss": 1.2396, "step": 15979 }, { "epoch": 0.48, "learning_rate": 2.7715559517650624e-06, "loss": 1.0737, "step": 15980 }, { "epoch": 0.48, "learning_rate": 2.7713134736790177e-06, "loss": 1.2092, "step": 15981 }, { "epoch": 0.48, "learning_rate": 2.771070993010199e-06, "loss": 1.1055, "step": 15982 }, { "epoch": 0.48, "learning_rate": 2.7708285097609157e-06, "loss": 1.124, "step": 15983 }, { "epoch": 0.48, "learning_rate": 2.7705860239334748e-06, "loss": 1.1552, "step": 15984 }, { "epoch": 0.48, "learning_rate": 2.770343535530186e-06, "loss": 1.1707, "step": 15985 }, { "epoch": 0.48, "learning_rate": 2.7701010445533564e-06, "loss": 1.1041, "step": 15986 }, { "epoch": 0.48, "learning_rate": 2.769858551005295e-06, "loss": 1.2188, "step": 15987 }, { "epoch": 0.48, "learning_rate": 2.7696160548883107e-06, "loss": 1.0878, "step": 15988 }, { "epoch": 0.48, "learning_rate": 2.7693735562047104e-06, "loss": 1.0731, "step": 15989 }, { "epoch": 0.48, "learning_rate": 2.7691310549568047e-06, "loss": 1.1761, "step": 15990 }, { "epoch": 0.48, "learning_rate": 2.7688885511469e-06, "loss": 1.1047, "step": 15991 }, { "epoch": 0.48, "learning_rate": 2.7686460447773067e-06, "loss": 1.1591, "step": 15992 }, { "epoch": 0.48, "learning_rate": 2.7684035358503316e-06, "loss": 1.1494, "step": 15993 }, { "epoch": 0.48, "learning_rate": 2.7681610243682845e-06, "loss": 1.2322, "step": 15994 }, { "epoch": 0.48, "learning_rate": 2.7679185103334733e-06, "loss": 1.1709, "step": 15995 }, { "epoch": 0.48, "learning_rate": 2.7676759937482073e-06, "loss": 1.0615, "step": 15996 }, { "epoch": 0.48, "learning_rate": 2.7674334746147948e-06, "loss": 1.2061, "step": 15997 }, { "epoch": 0.48, "learning_rate": 2.7671909529355447e-06, "loss": 0.9898, "step": 15998 }, { "epoch": 0.48, "learning_rate": 2.7669484287127647e-06, "loss": 1.1786, "step": 15999 }, { "epoch": 0.48, "learning_rate": 2.766705901948764e-06, "loss": 1.0267, "step": 16000 }, { "epoch": 0.48, "learning_rate": 2.7664633726458523e-06, "loss": 1.1178, "step": 16001 }, { "epoch": 0.48, "learning_rate": 2.7662208408063373e-06, "loss": 1.0682, "step": 16002 }, { "epoch": 0.48, "learning_rate": 2.7659783064325286e-06, "loss": 1.0961, "step": 16003 }, { "epoch": 0.48, "learning_rate": 2.765735769526734e-06, "loss": 1.0317, "step": 16004 }, { "epoch": 0.48, "learning_rate": 2.765493230091263e-06, "loss": 1.1462, "step": 16005 }, { "epoch": 0.48, "learning_rate": 2.765250688128424e-06, "loss": 1.269, "step": 16006 }, { "epoch": 0.48, "learning_rate": 2.765008143640526e-06, "loss": 1.1854, "step": 16007 }, { "epoch": 0.48, "learning_rate": 2.7647655966298786e-06, "loss": 1.1203, "step": 16008 }, { "epoch": 0.48, "learning_rate": 2.7645230470987905e-06, "loss": 1.0847, "step": 16009 }, { "epoch": 0.48, "learning_rate": 2.76428049504957e-06, "loss": 1.1017, "step": 16010 }, { "epoch": 0.48, "learning_rate": 2.764037940484527e-06, "loss": 1.0447, "step": 16011 }, { "epoch": 0.48, "learning_rate": 2.7637953834059693e-06, "loss": 1.1434, "step": 16012 }, { "epoch": 0.48, "learning_rate": 2.7635528238162066e-06, "loss": 1.1839, "step": 16013 }, { "epoch": 0.48, "learning_rate": 2.7633102617175484e-06, "loss": 1.1732, "step": 16014 }, { "epoch": 0.48, "learning_rate": 2.7630676971123033e-06, "loss": 1.1641, "step": 16015 }, { "epoch": 0.48, "learning_rate": 2.7628251300027803e-06, "loss": 1.1755, "step": 16016 }, { "epoch": 0.48, "learning_rate": 2.762582560391288e-06, "loss": 1.1737, "step": 16017 }, { "epoch": 0.48, "learning_rate": 2.7623399882801375e-06, "loss": 1.1424, "step": 16018 }, { "epoch": 0.48, "learning_rate": 2.7620974136716353e-06, "loss": 1.1116, "step": 16019 }, { "epoch": 0.48, "learning_rate": 2.761854836568093e-06, "loss": 1.2014, "step": 16020 }, { "epoch": 0.48, "learning_rate": 2.7616122569718186e-06, "loss": 1.1093, "step": 16021 }, { "epoch": 0.48, "learning_rate": 2.761369674885121e-06, "loss": 1.1188, "step": 16022 }, { "epoch": 0.48, "learning_rate": 2.76112709031031e-06, "loss": 1.2332, "step": 16023 }, { "epoch": 0.48, "learning_rate": 2.7608845032496955e-06, "loss": 1.1252, "step": 16024 }, { "epoch": 0.48, "learning_rate": 2.760641913705586e-06, "loss": 1.005, "step": 16025 }, { "epoch": 0.48, "learning_rate": 2.76039932168029e-06, "loss": 1.1461, "step": 16026 }, { "epoch": 0.48, "learning_rate": 2.7601567271761194e-06, "loss": 1.0936, "step": 16027 }, { "epoch": 0.48, "learning_rate": 2.7599141301953807e-06, "loss": 1.1173, "step": 16028 }, { "epoch": 0.48, "learning_rate": 2.759671530740386e-06, "loss": 1.1788, "step": 16029 }, { "epoch": 0.48, "learning_rate": 2.7594289288134423e-06, "loss": 1.1644, "step": 16030 }, { "epoch": 0.48, "learning_rate": 2.759186324416861e-06, "loss": 1.1646, "step": 16031 }, { "epoch": 0.48, "learning_rate": 2.75894371755295e-06, "loss": 1.075, "step": 16032 }, { "epoch": 0.48, "learning_rate": 2.75870110822402e-06, "loss": 1.1077, "step": 16033 }, { "epoch": 0.48, "learning_rate": 2.7584584964323796e-06, "loss": 1.1254, "step": 16034 }, { "epoch": 0.48, "learning_rate": 2.7582158821803383e-06, "loss": 1.1395, "step": 16035 }, { "epoch": 0.48, "learning_rate": 2.7579732654702066e-06, "loss": 1.1824, "step": 16036 }, { "epoch": 0.48, "learning_rate": 2.7577306463042948e-06, "loss": 1.105, "step": 16037 }, { "epoch": 0.48, "learning_rate": 2.75748802468491e-06, "loss": 1.1101, "step": 16038 }, { "epoch": 0.48, "learning_rate": 2.757245400614364e-06, "loss": 1.0481, "step": 16039 }, { "epoch": 0.48, "learning_rate": 2.7570027740949652e-06, "loss": 1.0468, "step": 16040 }, { "epoch": 0.48, "learning_rate": 2.7567601451290236e-06, "loss": 1.0306, "step": 16041 }, { "epoch": 0.48, "learning_rate": 2.75651751371885e-06, "loss": 1.147, "step": 16042 }, { "epoch": 0.48, "learning_rate": 2.756274879866752e-06, "loss": 1.1215, "step": 16043 }, { "epoch": 0.48, "learning_rate": 2.756032243575042e-06, "loss": 1.2065, "step": 16044 }, { "epoch": 0.48, "learning_rate": 2.755789604846027e-06, "loss": 1.2151, "step": 16045 }, { "epoch": 0.48, "learning_rate": 2.7555469636820194e-06, "loss": 1.1773, "step": 16046 }, { "epoch": 0.48, "learning_rate": 2.755304320085327e-06, "loss": 0.9988, "step": 16047 }, { "epoch": 0.48, "learning_rate": 2.7550616740582595e-06, "loss": 1.0742, "step": 16048 }, { "epoch": 0.48, "learning_rate": 2.754819025603129e-06, "loss": 1.1843, "step": 16049 }, { "epoch": 0.48, "learning_rate": 2.754576374722244e-06, "loss": 1.1708, "step": 16050 }, { "epoch": 0.48, "learning_rate": 2.7543337214179145e-06, "loss": 1.0774, "step": 16051 }, { "epoch": 0.48, "learning_rate": 2.7540910656924504e-06, "loss": 1.084, "step": 16052 }, { "epoch": 0.48, "learning_rate": 2.7538484075481613e-06, "loss": 1.0947, "step": 16053 }, { "epoch": 0.48, "learning_rate": 2.753605746987358e-06, "loss": 1.1231, "step": 16054 }, { "epoch": 0.48, "learning_rate": 2.7533630840123503e-06, "loss": 1.2329, "step": 16055 }, { "epoch": 0.48, "learning_rate": 2.753120418625448e-06, "loss": 1.1182, "step": 16056 }, { "epoch": 0.48, "learning_rate": 2.752877750828961e-06, "loss": 1.0246, "step": 16057 }, { "epoch": 0.48, "learning_rate": 2.7526350806251996e-06, "loss": 1.1885, "step": 16058 }, { "epoch": 0.48, "learning_rate": 2.7523924080164745e-06, "loss": 1.1606, "step": 16059 }, { "epoch": 0.48, "learning_rate": 2.7521497330050947e-06, "loss": 1.1003, "step": 16060 }, { "epoch": 0.48, "learning_rate": 2.7519070555933704e-06, "loss": 1.1291, "step": 16061 }, { "epoch": 0.48, "learning_rate": 2.751664375783613e-06, "loss": 1.1488, "step": 16062 }, { "epoch": 0.48, "learning_rate": 2.751421693578131e-06, "loss": 1.1351, "step": 16063 }, { "epoch": 0.48, "learning_rate": 2.7511790089792367e-06, "loss": 1.036, "step": 16064 }, { "epoch": 0.48, "learning_rate": 2.750936321989239e-06, "loss": 1.1066, "step": 16065 }, { "epoch": 0.48, "learning_rate": 2.7506936326104477e-06, "loss": 0.9763, "step": 16066 }, { "epoch": 0.48, "learning_rate": 2.7504509408451742e-06, "loss": 1.1485, "step": 16067 }, { "epoch": 0.48, "learning_rate": 2.7502082466957287e-06, "loss": 1.2507, "step": 16068 }, { "epoch": 0.48, "learning_rate": 2.7499655501644206e-06, "loss": 1.185, "step": 16069 }, { "epoch": 0.48, "learning_rate": 2.749722851253561e-06, "loss": 1.142, "step": 16070 }, { "epoch": 0.48, "learning_rate": 2.7494801499654604e-06, "loss": 1.0369, "step": 16071 }, { "epoch": 0.48, "learning_rate": 2.7492374463024293e-06, "loss": 1.1508, "step": 16072 }, { "epoch": 0.48, "learning_rate": 2.7489947402667767e-06, "loss": 1.1635, "step": 16073 }, { "epoch": 0.48, "learning_rate": 2.748752031860815e-06, "loss": 1.2188, "step": 16074 }, { "epoch": 0.48, "learning_rate": 2.748509321086853e-06, "loss": 1.2054, "step": 16075 }, { "epoch": 0.48, "learning_rate": 2.748266607947202e-06, "loss": 1.1135, "step": 16076 }, { "epoch": 0.48, "learning_rate": 2.7480238924441727e-06, "loss": 1.1978, "step": 16077 }, { "epoch": 0.48, "learning_rate": 2.747781174580076e-06, "loss": 1.1237, "step": 16078 }, { "epoch": 0.48, "learning_rate": 2.747538454357221e-06, "loss": 1.2153, "step": 16079 }, { "epoch": 0.48, "learning_rate": 2.747295731777919e-06, "loss": 1.1854, "step": 16080 }, { "epoch": 0.48, "learning_rate": 2.7470530068444816e-06, "loss": 1.0599, "step": 16081 }, { "epoch": 0.48, "learning_rate": 2.746810279559218e-06, "loss": 1.1895, "step": 16082 }, { "epoch": 0.48, "learning_rate": 2.74656754992444e-06, "loss": 1.1599, "step": 16083 }, { "epoch": 0.48, "learning_rate": 2.7463248179424567e-06, "loss": 1.0601, "step": 16084 }, { "epoch": 0.48, "learning_rate": 2.746082083615581e-06, "loss": 1.211, "step": 16085 }, { "epoch": 0.48, "learning_rate": 2.7458393469461212e-06, "loss": 1.1449, "step": 16086 }, { "epoch": 0.48, "learning_rate": 2.74559660793639e-06, "loss": 1.2852, "step": 16087 }, { "epoch": 0.48, "learning_rate": 2.745353866588697e-06, "loss": 1.0952, "step": 16088 }, { "epoch": 0.48, "learning_rate": 2.7451111229053534e-06, "loss": 1.1298, "step": 16089 }, { "epoch": 0.48, "learning_rate": 2.7448683768886695e-06, "loss": 1.1102, "step": 16090 }, { "epoch": 0.48, "learning_rate": 2.7446256285409578e-06, "loss": 1.0709, "step": 16091 }, { "epoch": 0.48, "learning_rate": 2.7443828778645267e-06, "loss": 1.1812, "step": 16092 }, { "epoch": 0.48, "learning_rate": 2.7441401248616883e-06, "loss": 1.1577, "step": 16093 }, { "epoch": 0.48, "learning_rate": 2.743897369534755e-06, "loss": 1.1987, "step": 16094 }, { "epoch": 0.48, "learning_rate": 2.7436546118860345e-06, "loss": 1.0576, "step": 16095 }, { "epoch": 0.48, "learning_rate": 2.7434118519178404e-06, "loss": 1.1311, "step": 16096 }, { "epoch": 0.48, "learning_rate": 2.7431690896324827e-06, "loss": 1.1349, "step": 16097 }, { "epoch": 0.48, "learning_rate": 2.7429263250322725e-06, "loss": 1.0914, "step": 16098 }, { "epoch": 0.48, "learning_rate": 2.74268355811952e-06, "loss": 1.0321, "step": 16099 }, { "epoch": 0.49, "learning_rate": 2.7424407888965377e-06, "loss": 1.167, "step": 16100 }, { "epoch": 0.49, "learning_rate": 2.742198017365635e-06, "loss": 1.0995, "step": 16101 }, { "epoch": 0.49, "learning_rate": 2.7419552435291234e-06, "loss": 1.1304, "step": 16102 }, { "epoch": 0.49, "learning_rate": 2.7417124673893158e-06, "loss": 1.2036, "step": 16103 }, { "epoch": 0.49, "learning_rate": 2.7414696889485216e-06, "loss": 1.0356, "step": 16104 }, { "epoch": 0.49, "learning_rate": 2.7412269082090514e-06, "loss": 1.1152, "step": 16105 }, { "epoch": 0.49, "learning_rate": 2.740984125173218e-06, "loss": 1.2353, "step": 16106 }, { "epoch": 0.49, "learning_rate": 2.7407413398433314e-06, "loss": 1.0413, "step": 16107 }, { "epoch": 0.49, "learning_rate": 2.740498552221703e-06, "loss": 1.0149, "step": 16108 }, { "epoch": 0.49, "learning_rate": 2.740255762310645e-06, "loss": 1.119, "step": 16109 }, { "epoch": 0.49, "learning_rate": 2.740012970112467e-06, "loss": 1.165, "step": 16110 }, { "epoch": 0.49, "learning_rate": 2.7397701756294826e-06, "loss": 1.1661, "step": 16111 }, { "epoch": 0.49, "learning_rate": 2.7395273788640005e-06, "loss": 1.2197, "step": 16112 }, { "epoch": 0.49, "learning_rate": 2.739284579818333e-06, "loss": 1.1774, "step": 16113 }, { "epoch": 0.49, "learning_rate": 2.7390417784947914e-06, "loss": 1.153, "step": 16114 }, { "epoch": 0.49, "learning_rate": 2.7387989748956884e-06, "loss": 1.0751, "step": 16115 }, { "epoch": 0.49, "learning_rate": 2.7385561690233324e-06, "loss": 1.1922, "step": 16116 }, { "epoch": 0.49, "learning_rate": 2.738313360880038e-06, "loss": 1.2065, "step": 16117 }, { "epoch": 0.49, "learning_rate": 2.738070550468114e-06, "loss": 1.0917, "step": 16118 }, { "epoch": 0.49, "learning_rate": 2.737827737789873e-06, "loss": 1.1201, "step": 16119 }, { "epoch": 0.49, "learning_rate": 2.737584922847628e-06, "loss": 1.1282, "step": 16120 }, { "epoch": 0.49, "learning_rate": 2.7373421056436876e-06, "loss": 1.1486, "step": 16121 }, { "epoch": 0.49, "learning_rate": 2.7370992861803657e-06, "loss": 1.0176, "step": 16122 }, { "epoch": 0.49, "learning_rate": 2.736856464459972e-06, "loss": 1.1735, "step": 16123 }, { "epoch": 0.49, "learning_rate": 2.7366136404848193e-06, "loss": 1.1764, "step": 16124 }, { "epoch": 0.49, "learning_rate": 2.736370814257218e-06, "loss": 1.188, "step": 16125 }, { "epoch": 0.49, "learning_rate": 2.7361279857794814e-06, "loss": 1.1405, "step": 16126 }, { "epoch": 0.49, "learning_rate": 2.7358851550539195e-06, "loss": 1.0406, "step": 16127 }, { "epoch": 0.49, "learning_rate": 2.735642322082845e-06, "loss": 1.0134, "step": 16128 }, { "epoch": 0.49, "learning_rate": 2.7353994868685685e-06, "loss": 1.0696, "step": 16129 }, { "epoch": 0.49, "learning_rate": 2.735156649413402e-06, "loss": 1.2159, "step": 16130 }, { "epoch": 0.49, "learning_rate": 2.7349138097196577e-06, "loss": 1.0328, "step": 16131 }, { "epoch": 0.49, "learning_rate": 2.734670967789648e-06, "loss": 1.2195, "step": 16132 }, { "epoch": 0.49, "learning_rate": 2.7344281236256826e-06, "loss": 1.1967, "step": 16133 }, { "epoch": 0.49, "learning_rate": 2.7341852772300743e-06, "loss": 1.1661, "step": 16134 }, { "epoch": 0.49, "learning_rate": 2.733942428605136e-06, "loss": 1.0835, "step": 16135 }, { "epoch": 0.49, "learning_rate": 2.7336995777531773e-06, "loss": 1.1985, "step": 16136 }, { "epoch": 0.49, "learning_rate": 2.733456724676512e-06, "loss": 1.1201, "step": 16137 }, { "epoch": 0.49, "learning_rate": 2.7332138693774508e-06, "loss": 1.1113, "step": 16138 }, { "epoch": 0.49, "learning_rate": 2.732971011858306e-06, "loss": 1.1176, "step": 16139 }, { "epoch": 0.49, "learning_rate": 2.732728152121389e-06, "loss": 1.1664, "step": 16140 }, { "epoch": 0.49, "learning_rate": 2.732485290169013e-06, "loss": 0.9858, "step": 16141 }, { "epoch": 0.49, "learning_rate": 2.732242426003488e-06, "loss": 1.071, "step": 16142 }, { "epoch": 0.49, "learning_rate": 2.731999559627127e-06, "loss": 1.0351, "step": 16143 }, { "epoch": 0.49, "learning_rate": 2.7317566910422428e-06, "loss": 1.1217, "step": 16144 }, { "epoch": 0.49, "learning_rate": 2.7315138202511454e-06, "loss": 1.1962, "step": 16145 }, { "epoch": 0.49, "learning_rate": 2.7312709472561484e-06, "loss": 1.0366, "step": 16146 }, { "epoch": 0.49, "learning_rate": 2.7310280720595633e-06, "loss": 1.0448, "step": 16147 }, { "epoch": 0.49, "learning_rate": 2.7307851946637025e-06, "loss": 1.1024, "step": 16148 }, { "epoch": 0.49, "learning_rate": 2.730542315070878e-06, "loss": 1.1063, "step": 16149 }, { "epoch": 0.49, "learning_rate": 2.7302994332834014e-06, "loss": 1.1545, "step": 16150 }, { "epoch": 0.49, "learning_rate": 2.730056549303585e-06, "loss": 1.0533, "step": 16151 }, { "epoch": 0.49, "learning_rate": 2.7298136631337412e-06, "loss": 1.1269, "step": 16152 }, { "epoch": 0.49, "learning_rate": 2.7295707747761818e-06, "loss": 1.1809, "step": 16153 }, { "epoch": 0.49, "learning_rate": 2.7293278842332193e-06, "loss": 1.1437, "step": 16154 }, { "epoch": 0.49, "learning_rate": 2.729084991507166e-06, "loss": 1.0942, "step": 16155 }, { "epoch": 0.49, "learning_rate": 2.7288420966003336e-06, "loss": 1.1827, "step": 16156 }, { "epoch": 0.49, "learning_rate": 2.728599199515035e-06, "loss": 1.124, "step": 16157 }, { "epoch": 0.49, "learning_rate": 2.7283563002535816e-06, "loss": 1.0665, "step": 16158 }, { "epoch": 0.49, "learning_rate": 2.7281133988182862e-06, "loss": 1.0693, "step": 16159 }, { "epoch": 0.49, "learning_rate": 2.727870495211461e-06, "loss": 1.1979, "step": 16160 }, { "epoch": 0.49, "learning_rate": 2.7276275894354194e-06, "loss": 1.2285, "step": 16161 }, { "epoch": 0.49, "learning_rate": 2.727384681492472e-06, "loss": 1.1289, "step": 16162 }, { "epoch": 0.49, "learning_rate": 2.7271417713849326e-06, "loss": 1.1462, "step": 16163 }, { "epoch": 0.49, "learning_rate": 2.7268988591151125e-06, "loss": 0.9995, "step": 16164 }, { "epoch": 0.49, "learning_rate": 2.7266559446853246e-06, "loss": 1.0909, "step": 16165 }, { "epoch": 0.49, "learning_rate": 2.7264130280978807e-06, "loss": 1.0823, "step": 16166 }, { "epoch": 0.49, "learning_rate": 2.7261701093550946e-06, "loss": 1.1763, "step": 16167 }, { "epoch": 0.49, "learning_rate": 2.7259271884592773e-06, "loss": 1.3292, "step": 16168 }, { "epoch": 0.49, "learning_rate": 2.725684265412743e-06, "loss": 1.0997, "step": 16169 }, { "epoch": 0.49, "learning_rate": 2.7254413402178025e-06, "loss": 1.1576, "step": 16170 }, { "epoch": 0.49, "learning_rate": 2.725198412876769e-06, "loss": 1.1338, "step": 16171 }, { "epoch": 0.49, "learning_rate": 2.724955483391955e-06, "loss": 1.1196, "step": 16172 }, { "epoch": 0.49, "learning_rate": 2.724712551765673e-06, "loss": 1.2173, "step": 16173 }, { "epoch": 0.49, "learning_rate": 2.724469618000236e-06, "loss": 1.1686, "step": 16174 }, { "epoch": 0.49, "learning_rate": 2.724226682097956e-06, "loss": 1.1, "step": 16175 }, { "epoch": 0.49, "learning_rate": 2.7239837440611473e-06, "loss": 1.1018, "step": 16176 }, { "epoch": 0.49, "learning_rate": 2.72374080389212e-06, "loss": 1.1727, "step": 16177 }, { "epoch": 0.49, "learning_rate": 2.723497861593188e-06, "loss": 1.0082, "step": 16178 }, { "epoch": 0.49, "learning_rate": 2.7232549171666644e-06, "loss": 1.0677, "step": 16179 }, { "epoch": 0.49, "learning_rate": 2.7230119706148617e-06, "loss": 1.1005, "step": 16180 }, { "epoch": 0.49, "learning_rate": 2.722769021940092e-06, "loss": 1.1389, "step": 16181 }, { "epoch": 0.49, "learning_rate": 2.722526071144669e-06, "loss": 1.0229, "step": 16182 }, { "epoch": 0.49, "learning_rate": 2.7222831182309047e-06, "loss": 1.1027, "step": 16183 }, { "epoch": 0.49, "learning_rate": 2.722040163201112e-06, "loss": 1.0336, "step": 16184 }, { "epoch": 0.49, "learning_rate": 2.7217972060576035e-06, "loss": 1.0279, "step": 16185 }, { "epoch": 0.49, "learning_rate": 2.721554246802693e-06, "loss": 0.9888, "step": 16186 }, { "epoch": 0.49, "learning_rate": 2.7213112854386926e-06, "loss": 1.1224, "step": 16187 }, { "epoch": 0.49, "learning_rate": 2.721068321967915e-06, "loss": 1.1281, "step": 16188 }, { "epoch": 0.49, "learning_rate": 2.7208253563926747e-06, "loss": 1.1609, "step": 16189 }, { "epoch": 0.49, "learning_rate": 2.7205823887152815e-06, "loss": 1.0848, "step": 16190 }, { "epoch": 0.49, "learning_rate": 2.720339418938052e-06, "loss": 1.1535, "step": 16191 }, { "epoch": 0.49, "learning_rate": 2.720096447063296e-06, "loss": 1.0323, "step": 16192 }, { "epoch": 0.49, "learning_rate": 2.719853473093329e-06, "loss": 1.0972, "step": 16193 }, { "epoch": 0.49, "learning_rate": 2.719610497030462e-06, "loss": 1.0518, "step": 16194 }, { "epoch": 0.49, "learning_rate": 2.7193675188770093e-06, "loss": 1.1384, "step": 16195 }, { "epoch": 0.49, "learning_rate": 2.7191245386352834e-06, "loss": 1.2073, "step": 16196 }, { "epoch": 0.49, "learning_rate": 2.718881556307597e-06, "loss": 1.1428, "step": 16197 }, { "epoch": 0.49, "learning_rate": 2.7186385718962637e-06, "loss": 1.1469, "step": 16198 }, { "epoch": 0.49, "learning_rate": 2.7183955854035964e-06, "loss": 1.0115, "step": 16199 }, { "epoch": 0.49, "learning_rate": 2.7181525968319084e-06, "loss": 1.1637, "step": 16200 }, { "epoch": 0.49, "learning_rate": 2.7179096061835133e-06, "loss": 1.153, "step": 16201 }, { "epoch": 0.49, "learning_rate": 2.7176666134607234e-06, "loss": 1.2159, "step": 16202 }, { "epoch": 0.49, "learning_rate": 2.7174236186658513e-06, "loss": 1.1008, "step": 16203 }, { "epoch": 0.49, "learning_rate": 2.7171806218012126e-06, "loss": 1.1016, "step": 16204 }, { "epoch": 0.49, "learning_rate": 2.716937622869118e-06, "loss": 1.1647, "step": 16205 }, { "epoch": 0.49, "learning_rate": 2.716694621871882e-06, "loss": 1.0443, "step": 16206 }, { "epoch": 0.49, "learning_rate": 2.7164516188118173e-06, "loss": 1.1197, "step": 16207 }, { "epoch": 0.49, "learning_rate": 2.716208613691238e-06, "loss": 1.2527, "step": 16208 }, { "epoch": 0.49, "learning_rate": 2.715965606512456e-06, "loss": 1.1545, "step": 16209 }, { "epoch": 0.49, "learning_rate": 2.7157225972777864e-06, "loss": 0.9782, "step": 16210 }, { "epoch": 0.49, "learning_rate": 2.715479585989541e-06, "loss": 1.0524, "step": 16211 }, { "epoch": 0.49, "learning_rate": 2.7152365726500334e-06, "loss": 1.0975, "step": 16212 }, { "epoch": 0.49, "learning_rate": 2.714993557261578e-06, "loss": 1.1462, "step": 16213 }, { "epoch": 0.49, "learning_rate": 2.714750539826486e-06, "loss": 1.0798, "step": 16214 }, { "epoch": 0.49, "learning_rate": 2.714507520347074e-06, "loss": 1.0593, "step": 16215 }, { "epoch": 0.49, "learning_rate": 2.7142644988256527e-06, "loss": 1.0996, "step": 16216 }, { "epoch": 0.49, "learning_rate": 2.7140214752645376e-06, "loss": 1.1531, "step": 16217 }, { "epoch": 0.49, "learning_rate": 2.71377844966604e-06, "loss": 1.184, "step": 16218 }, { "epoch": 0.49, "learning_rate": 2.713535422032476e-06, "loss": 1.1413, "step": 16219 }, { "epoch": 0.49, "learning_rate": 2.7132923923661565e-06, "loss": 1.1027, "step": 16220 }, { "epoch": 0.49, "learning_rate": 2.713049360669396e-06, "loss": 1.2507, "step": 16221 }, { "epoch": 0.49, "learning_rate": 2.7128063269445086e-06, "loss": 1.1148, "step": 16222 }, { "epoch": 0.49, "learning_rate": 2.7125632911938075e-06, "loss": 1.065, "step": 16223 }, { "epoch": 0.49, "learning_rate": 2.7123202534196065e-06, "loss": 1.2606, "step": 16224 }, { "epoch": 0.49, "learning_rate": 2.712077213624218e-06, "loss": 1.0832, "step": 16225 }, { "epoch": 0.49, "learning_rate": 2.711834171809958e-06, "loss": 1.1629, "step": 16226 }, { "epoch": 0.49, "learning_rate": 2.711591127979137e-06, "loss": 1.1162, "step": 16227 }, { "epoch": 0.49, "learning_rate": 2.711348082134071e-06, "loss": 1.2245, "step": 16228 }, { "epoch": 0.49, "learning_rate": 2.7111050342770734e-06, "loss": 1.0168, "step": 16229 }, { "epoch": 0.49, "learning_rate": 2.7108619844104577e-06, "loss": 1.2194, "step": 16230 }, { "epoch": 0.49, "learning_rate": 2.710618932536537e-06, "loss": 1.2864, "step": 16231 }, { "epoch": 0.49, "learning_rate": 2.710375878657626e-06, "loss": 1.1174, "step": 16232 }, { "epoch": 0.49, "learning_rate": 2.710132822776037e-06, "loss": 1.1466, "step": 16233 }, { "epoch": 0.49, "learning_rate": 2.709889764894086e-06, "loss": 1.0679, "step": 16234 }, { "epoch": 0.49, "learning_rate": 2.7096467050140847e-06, "loss": 1.2128, "step": 16235 }, { "epoch": 0.49, "learning_rate": 2.709403643138348e-06, "loss": 1.1299, "step": 16236 }, { "epoch": 0.49, "learning_rate": 2.7091605792691893e-06, "loss": 1.1202, "step": 16237 }, { "epoch": 0.49, "learning_rate": 2.708917513408923e-06, "loss": 1.1326, "step": 16238 }, { "epoch": 0.49, "learning_rate": 2.7086744455598625e-06, "loss": 1.1417, "step": 16239 }, { "epoch": 0.49, "learning_rate": 2.708431375724321e-06, "loss": 0.9979, "step": 16240 }, { "epoch": 0.49, "learning_rate": 2.7081883039046136e-06, "loss": 1.075, "step": 16241 }, { "epoch": 0.49, "learning_rate": 2.707945230103054e-06, "loss": 1.1306, "step": 16242 }, { "epoch": 0.49, "learning_rate": 2.7077021543219563e-06, "loss": 1.2521, "step": 16243 }, { "epoch": 0.49, "learning_rate": 2.707459076563633e-06, "loss": 1.0849, "step": 16244 }, { "epoch": 0.49, "learning_rate": 2.7072159968304007e-06, "loss": 1.2342, "step": 16245 }, { "epoch": 0.49, "learning_rate": 2.7069729151245712e-06, "loss": 0.9863, "step": 16246 }, { "epoch": 0.49, "learning_rate": 2.7067298314484592e-06, "loss": 1.0994, "step": 16247 }, { "epoch": 0.49, "learning_rate": 2.706486745804379e-06, "loss": 1.0363, "step": 16248 }, { "epoch": 0.49, "learning_rate": 2.7062436581946437e-06, "loss": 1.1758, "step": 16249 }, { "epoch": 0.49, "learning_rate": 2.706000568621569e-06, "loss": 1.1384, "step": 16250 }, { "epoch": 0.49, "learning_rate": 2.705757477087468e-06, "loss": 1.1237, "step": 16251 }, { "epoch": 0.49, "learning_rate": 2.705514383594654e-06, "loss": 1.071, "step": 16252 }, { "epoch": 0.49, "learning_rate": 2.705271288145443e-06, "loss": 1.2394, "step": 16253 }, { "epoch": 0.49, "learning_rate": 2.7050281907421473e-06, "loss": 1.0516, "step": 16254 }, { "epoch": 0.49, "learning_rate": 2.704785091387082e-06, "loss": 1.2152, "step": 16255 }, { "epoch": 0.49, "learning_rate": 2.7045419900825626e-06, "loss": 1.2141, "step": 16256 }, { "epoch": 0.49, "learning_rate": 2.7042988868309004e-06, "loss": 1.1366, "step": 16257 }, { "epoch": 0.49, "learning_rate": 2.7040557816344125e-06, "loss": 1.1832, "step": 16258 }, { "epoch": 0.49, "learning_rate": 2.7038126744954112e-06, "loss": 1.1533, "step": 16259 }, { "epoch": 0.49, "learning_rate": 2.703569565416212e-06, "loss": 1.1017, "step": 16260 }, { "epoch": 0.49, "learning_rate": 2.703326454399128e-06, "loss": 1.1273, "step": 16261 }, { "epoch": 0.49, "learning_rate": 2.703083341446474e-06, "loss": 1.1221, "step": 16262 }, { "epoch": 0.49, "learning_rate": 2.7028402265605645e-06, "loss": 1.1063, "step": 16263 }, { "epoch": 0.49, "learning_rate": 2.702597109743714e-06, "loss": 1.0961, "step": 16264 }, { "epoch": 0.49, "learning_rate": 2.7023539909982367e-06, "loss": 1.1641, "step": 16265 }, { "epoch": 0.49, "learning_rate": 2.702110870326446e-06, "loss": 1.0535, "step": 16266 }, { "epoch": 0.49, "learning_rate": 2.701867747730658e-06, "loss": 1.0539, "step": 16267 }, { "epoch": 0.49, "learning_rate": 2.701624623213186e-06, "loss": 1.3209, "step": 16268 }, { "epoch": 0.49, "learning_rate": 2.701381496776344e-06, "loss": 1.2203, "step": 16269 }, { "epoch": 0.49, "learning_rate": 2.701138368422448e-06, "loss": 1.1614, "step": 16270 }, { "epoch": 0.49, "learning_rate": 2.700895238153811e-06, "loss": 1.0237, "step": 16271 }, { "epoch": 0.49, "learning_rate": 2.7006521059727488e-06, "loss": 1.0729, "step": 16272 }, { "epoch": 0.49, "learning_rate": 2.700408971881575e-06, "loss": 1.1751, "step": 16273 }, { "epoch": 0.49, "learning_rate": 2.700165835882604e-06, "loss": 1.1071, "step": 16274 }, { "epoch": 0.49, "learning_rate": 2.6999226979781514e-06, "loss": 1.0557, "step": 16275 }, { "epoch": 0.49, "learning_rate": 2.6996795581705297e-06, "loss": 1.1005, "step": 16276 }, { "epoch": 0.49, "learning_rate": 2.6994364164620564e-06, "loss": 1.1377, "step": 16277 }, { "epoch": 0.49, "learning_rate": 2.699193272855043e-06, "loss": 1.1104, "step": 16278 }, { "epoch": 0.49, "learning_rate": 2.6989501273518058e-06, "loss": 1.2094, "step": 16279 }, { "epoch": 0.49, "learning_rate": 2.69870697995466e-06, "loss": 1.1356, "step": 16280 }, { "epoch": 0.49, "learning_rate": 2.698463830665919e-06, "loss": 1.1298, "step": 16281 }, { "epoch": 0.49, "learning_rate": 2.6982206794878973e-06, "loss": 1.0122, "step": 16282 }, { "epoch": 0.49, "learning_rate": 2.6979775264229107e-06, "loss": 1.1778, "step": 16283 }, { "epoch": 0.49, "learning_rate": 2.697734371473274e-06, "loss": 1.165, "step": 16284 }, { "epoch": 0.49, "learning_rate": 2.6974912146413006e-06, "loss": 1.2074, "step": 16285 }, { "epoch": 0.49, "learning_rate": 2.6972480559293062e-06, "loss": 1.1784, "step": 16286 }, { "epoch": 0.49, "learning_rate": 2.697004895339605e-06, "loss": 1.1812, "step": 16287 }, { "epoch": 0.49, "learning_rate": 2.6967617328745127e-06, "loss": 1.1143, "step": 16288 }, { "epoch": 0.49, "learning_rate": 2.6965185685363433e-06, "loss": 1.1572, "step": 16289 }, { "epoch": 0.49, "learning_rate": 2.696275402327412e-06, "loss": 1.0795, "step": 16290 }, { "epoch": 0.49, "learning_rate": 2.696032234250032e-06, "loss": 1.1423, "step": 16291 }, { "epoch": 0.49, "learning_rate": 2.695789064306521e-06, "loss": 1.2546, "step": 16292 }, { "epoch": 0.49, "learning_rate": 2.6955458924991924e-06, "loss": 1.0999, "step": 16293 }, { "epoch": 0.49, "learning_rate": 2.6953027188303597e-06, "loss": 1.1105, "step": 16294 }, { "epoch": 0.49, "learning_rate": 2.69505954330234e-06, "loss": 1.0972, "step": 16295 }, { "epoch": 0.49, "learning_rate": 2.6948163659174476e-06, "loss": 1.1732, "step": 16296 }, { "epoch": 0.49, "learning_rate": 2.6945731866779973e-06, "loss": 1.2339, "step": 16297 }, { "epoch": 0.49, "learning_rate": 2.6943300055863036e-06, "loss": 1.1475, "step": 16298 }, { "epoch": 0.49, "learning_rate": 2.6940868226446827e-06, "loss": 1.1474, "step": 16299 }, { "epoch": 0.49, "learning_rate": 2.693843637855448e-06, "loss": 1.1157, "step": 16300 }, { "epoch": 0.49, "learning_rate": 2.693600451220915e-06, "loss": 1.1985, "step": 16301 }, { "epoch": 0.49, "learning_rate": 2.693357262743399e-06, "loss": 1.114, "step": 16302 }, { "epoch": 0.49, "learning_rate": 2.693114072425216e-06, "loss": 1.2533, "step": 16303 }, { "epoch": 0.49, "learning_rate": 2.6928708802686788e-06, "loss": 1.2197, "step": 16304 }, { "epoch": 0.49, "learning_rate": 2.6926276862761036e-06, "loss": 1.0855, "step": 16305 }, { "epoch": 0.49, "learning_rate": 2.692384490449807e-06, "loss": 1.1702, "step": 16306 }, { "epoch": 0.49, "learning_rate": 2.6921412927921015e-06, "loss": 1.1601, "step": 16307 }, { "epoch": 0.49, "learning_rate": 2.6918980933053035e-06, "loss": 1.0528, "step": 16308 }, { "epoch": 0.49, "learning_rate": 2.6916548919917286e-06, "loss": 1.0484, "step": 16309 }, { "epoch": 0.49, "learning_rate": 2.6914116888536913e-06, "loss": 1.2371, "step": 16310 }, { "epoch": 0.49, "learning_rate": 2.6911684838935066e-06, "loss": 1.1931, "step": 16311 }, { "epoch": 0.49, "learning_rate": 2.69092527711349e-06, "loss": 1.2063, "step": 16312 }, { "epoch": 0.49, "learning_rate": 2.6906820685159567e-06, "loss": 1.1242, "step": 16313 }, { "epoch": 0.49, "learning_rate": 2.6904388581032226e-06, "loss": 1.1718, "step": 16314 }, { "epoch": 0.49, "learning_rate": 2.690195645877602e-06, "loss": 1.033, "step": 16315 }, { "epoch": 0.49, "learning_rate": 2.6899524318414103e-06, "loss": 1.0667, "step": 16316 }, { "epoch": 0.49, "learning_rate": 2.6897092159969628e-06, "loss": 1.1906, "step": 16317 }, { "epoch": 0.49, "learning_rate": 2.6894659983465753e-06, "loss": 1.0877, "step": 16318 }, { "epoch": 0.49, "learning_rate": 2.6892227788925625e-06, "loss": 1.2109, "step": 16319 }, { "epoch": 0.49, "learning_rate": 2.6889795576372397e-06, "loss": 1.1696, "step": 16320 }, { "epoch": 0.49, "learning_rate": 2.688736334582923e-06, "loss": 1.1514, "step": 16321 }, { "epoch": 0.49, "learning_rate": 2.688493109731927e-06, "loss": 1.0701, "step": 16322 }, { "epoch": 0.49, "learning_rate": 2.6882498830865673e-06, "loss": 1.2657, "step": 16323 }, { "epoch": 0.49, "learning_rate": 2.6880066546491594e-06, "loss": 1.1025, "step": 16324 }, { "epoch": 0.49, "learning_rate": 2.687763424422019e-06, "loss": 1.2386, "step": 16325 }, { "epoch": 0.49, "learning_rate": 2.687520192407461e-06, "loss": 1.1917, "step": 16326 }, { "epoch": 0.49, "learning_rate": 2.6872769586078018e-06, "loss": 1.1006, "step": 16327 }, { "epoch": 0.49, "learning_rate": 2.687033723025355e-06, "loss": 1.0901, "step": 16328 }, { "epoch": 0.49, "learning_rate": 2.686790485662438e-06, "loss": 1.1181, "step": 16329 }, { "epoch": 0.49, "learning_rate": 2.686547246521365e-06, "loss": 1.157, "step": 16330 }, { "epoch": 0.49, "learning_rate": 2.6863040056044533e-06, "loss": 1.186, "step": 16331 }, { "epoch": 0.49, "learning_rate": 2.6860607629140156e-06, "loss": 1.073, "step": 16332 }, { "epoch": 0.49, "learning_rate": 2.6858175184523694e-06, "loss": 1.0871, "step": 16333 }, { "epoch": 0.49, "learning_rate": 2.6855742722218303e-06, "loss": 1.0262, "step": 16334 }, { "epoch": 0.49, "learning_rate": 2.6853310242247134e-06, "loss": 1.141, "step": 16335 }, { "epoch": 0.49, "learning_rate": 2.685087774463334e-06, "loss": 1.1243, "step": 16336 }, { "epoch": 0.49, "learning_rate": 2.684844522940009e-06, "loss": 1.2472, "step": 16337 }, { "epoch": 0.49, "learning_rate": 2.6846012696570527e-06, "loss": 1.0868, "step": 16338 }, { "epoch": 0.49, "learning_rate": 2.6843580146167806e-06, "loss": 1.1002, "step": 16339 }, { "epoch": 0.49, "learning_rate": 2.6841147578215105e-06, "loss": 1.2405, "step": 16340 }, { "epoch": 0.49, "learning_rate": 2.6838714992735555e-06, "loss": 1.1787, "step": 16341 }, { "epoch": 0.49, "learning_rate": 2.683628238975233e-06, "loss": 1.1547, "step": 16342 }, { "epoch": 0.49, "learning_rate": 2.6833849769288573e-06, "loss": 1.112, "step": 16343 }, { "epoch": 0.49, "learning_rate": 2.6831417131367456e-06, "loss": 1.1737, "step": 16344 }, { "epoch": 0.49, "learning_rate": 2.6828984476012127e-06, "loss": 1.111, "step": 16345 }, { "epoch": 0.49, "learning_rate": 2.6826551803245743e-06, "loss": 1.0966, "step": 16346 }, { "epoch": 0.49, "learning_rate": 2.682411911309147e-06, "loss": 1.1732, "step": 16347 }, { "epoch": 0.49, "learning_rate": 2.682168640557246e-06, "loss": 1.1445, "step": 16348 }, { "epoch": 0.49, "learning_rate": 2.681925368071187e-06, "loss": 1.2224, "step": 16349 }, { "epoch": 0.49, "learning_rate": 2.6816820938532873e-06, "loss": 1.209, "step": 16350 }, { "epoch": 0.49, "learning_rate": 2.68143881790586e-06, "loss": 1.1494, "step": 16351 }, { "epoch": 0.49, "learning_rate": 2.6811955402312232e-06, "loss": 1.0744, "step": 16352 }, { "epoch": 0.49, "learning_rate": 2.680952260831693e-06, "loss": 1.0465, "step": 16353 }, { "epoch": 0.49, "learning_rate": 2.6807089797095833e-06, "loss": 1.1115, "step": 16354 }, { "epoch": 0.49, "learning_rate": 2.6804656968672115e-06, "loss": 1.1699, "step": 16355 }, { "epoch": 0.49, "learning_rate": 2.6802224123068933e-06, "loss": 1.2184, "step": 16356 }, { "epoch": 0.49, "learning_rate": 2.6799791260309447e-06, "loss": 1.123, "step": 16357 }, { "epoch": 0.49, "learning_rate": 2.679735838041681e-06, "loss": 1.0979, "step": 16358 }, { "epoch": 0.49, "learning_rate": 2.6794925483414187e-06, "loss": 1.1146, "step": 16359 }, { "epoch": 0.49, "learning_rate": 2.679249256932474e-06, "loss": 1.2062, "step": 16360 }, { "epoch": 0.49, "learning_rate": 2.679005963817163e-06, "loss": 1.027, "step": 16361 }, { "epoch": 0.49, "learning_rate": 2.678762668997801e-06, "loss": 1.1417, "step": 16362 }, { "epoch": 0.49, "learning_rate": 2.6785193724767045e-06, "loss": 1.1116, "step": 16363 }, { "epoch": 0.49, "learning_rate": 2.67827607425619e-06, "loss": 1.0894, "step": 16364 }, { "epoch": 0.49, "learning_rate": 2.678032774338572e-06, "loss": 1.0458, "step": 16365 }, { "epoch": 0.49, "learning_rate": 2.677789472726169e-06, "loss": 1.0014, "step": 16366 }, { "epoch": 0.49, "learning_rate": 2.677546169421295e-06, "loss": 1.1577, "step": 16367 }, { "epoch": 0.49, "learning_rate": 2.6773028644262676e-06, "loss": 1.1682, "step": 16368 }, { "epoch": 0.49, "learning_rate": 2.677059557743402e-06, "loss": 1.1899, "step": 16369 }, { "epoch": 0.49, "learning_rate": 2.676816249375015e-06, "loss": 1.0936, "step": 16370 }, { "epoch": 0.49, "learning_rate": 2.676572939323422e-06, "loss": 1.0131, "step": 16371 }, { "epoch": 0.49, "learning_rate": 2.6763296275909394e-06, "loss": 0.9768, "step": 16372 }, { "epoch": 0.49, "learning_rate": 2.676086314179885e-06, "loss": 1.1167, "step": 16373 }, { "epoch": 0.49, "learning_rate": 2.6758429990925727e-06, "loss": 1.0216, "step": 16374 }, { "epoch": 0.49, "learning_rate": 2.67559968233132e-06, "loss": 1.1259, "step": 16375 }, { "epoch": 0.49, "learning_rate": 2.6753563638984424e-06, "loss": 1.123, "step": 16376 }, { "epoch": 0.49, "learning_rate": 2.6751130437962567e-06, "loss": 1.1638, "step": 16377 }, { "epoch": 0.49, "learning_rate": 2.6748697220270797e-06, "loss": 1.1241, "step": 16378 }, { "epoch": 0.49, "learning_rate": 2.6746263985932267e-06, "loss": 1.2039, "step": 16379 }, { "epoch": 0.49, "learning_rate": 2.674383073497015e-06, "loss": 1.1835, "step": 16380 }, { "epoch": 0.49, "learning_rate": 2.6741397467407603e-06, "loss": 1.1512, "step": 16381 }, { "epoch": 0.49, "learning_rate": 2.6738964183267792e-06, "loss": 1.11, "step": 16382 }, { "epoch": 0.49, "learning_rate": 2.673653088257388e-06, "loss": 1.0912, "step": 16383 }, { "epoch": 0.49, "learning_rate": 2.673409756534902e-06, "loss": 1.0038, "step": 16384 }, { "epoch": 0.49, "learning_rate": 2.6731664231616392e-06, "loss": 1.1285, "step": 16385 }, { "epoch": 0.49, "learning_rate": 2.6729230881399165e-06, "loss": 1.0875, "step": 16386 }, { "epoch": 0.49, "learning_rate": 2.6726797514720483e-06, "loss": 1.2291, "step": 16387 }, { "epoch": 0.49, "learning_rate": 2.672436413160352e-06, "loss": 1.1127, "step": 16388 }, { "epoch": 0.49, "learning_rate": 2.6721930732071442e-06, "loss": 1.1823, "step": 16389 }, { "epoch": 0.49, "learning_rate": 2.6719497316147412e-06, "loss": 1.1365, "step": 16390 }, { "epoch": 0.49, "learning_rate": 2.6717063883854598e-06, "loss": 0.9999, "step": 16391 }, { "epoch": 0.49, "learning_rate": 2.671463043521616e-06, "loss": 1.1047, "step": 16392 }, { "epoch": 0.49, "learning_rate": 2.6712196970255267e-06, "loss": 1.1946, "step": 16393 }, { "epoch": 0.49, "learning_rate": 2.670976348899509e-06, "loss": 1.1218, "step": 16394 }, { "epoch": 0.49, "learning_rate": 2.6707329991458774e-06, "loss": 1.117, "step": 16395 }, { "epoch": 0.49, "learning_rate": 2.670489647766951e-06, "loss": 1.071, "step": 16396 }, { "epoch": 0.49, "learning_rate": 2.6702462947650447e-06, "loss": 1.154, "step": 16397 }, { "epoch": 0.49, "learning_rate": 2.670002940142476e-06, "loss": 1.1116, "step": 16398 }, { "epoch": 0.49, "learning_rate": 2.669759583901562e-06, "loss": 1.133, "step": 16399 }, { "epoch": 0.49, "learning_rate": 2.669516226044617e-06, "loss": 1.1386, "step": 16400 }, { "epoch": 0.49, "learning_rate": 2.6692728665739597e-06, "loss": 1.1048, "step": 16401 }, { "epoch": 0.49, "learning_rate": 2.6690295054919063e-06, "loss": 1.0625, "step": 16402 }, { "epoch": 0.49, "learning_rate": 2.668786142800774e-06, "loss": 1.1882, "step": 16403 }, { "epoch": 0.49, "learning_rate": 2.6685427785028783e-06, "loss": 1.2377, "step": 16404 }, { "epoch": 0.49, "learning_rate": 2.668299412600536e-06, "loss": 1.1736, "step": 16405 }, { "epoch": 0.49, "learning_rate": 2.6680560450960646e-06, "loss": 1.1854, "step": 16406 }, { "epoch": 0.49, "learning_rate": 2.6678126759917816e-06, "loss": 1.0002, "step": 16407 }, { "epoch": 0.49, "learning_rate": 2.667569305290002e-06, "loss": 1.1433, "step": 16408 }, { "epoch": 0.49, "learning_rate": 2.6673259329930435e-06, "loss": 0.9651, "step": 16409 }, { "epoch": 0.49, "learning_rate": 2.667082559103222e-06, "loss": 1.1854, "step": 16410 }, { "epoch": 0.49, "learning_rate": 2.6668391836228563e-06, "loss": 1.0206, "step": 16411 }, { "epoch": 0.49, "learning_rate": 2.666595806554261e-06, "loss": 1.2062, "step": 16412 }, { "epoch": 0.49, "learning_rate": 2.666352427899754e-06, "loss": 1.1327, "step": 16413 }, { "epoch": 0.49, "learning_rate": 2.6661090476616527e-06, "loss": 1.1321, "step": 16414 }, { "epoch": 0.49, "learning_rate": 2.6658656658422722e-06, "loss": 1.212, "step": 16415 }, { "epoch": 0.49, "learning_rate": 2.665622282443931e-06, "loss": 1.222, "step": 16416 }, { "epoch": 0.49, "learning_rate": 2.6653788974689453e-06, "loss": 1.15, "step": 16417 }, { "epoch": 0.49, "learning_rate": 2.665135510919632e-06, "loss": 1.1836, "step": 16418 }, { "epoch": 0.49, "learning_rate": 2.6648921227983083e-06, "loss": 1.1082, "step": 16419 }, { "epoch": 0.49, "learning_rate": 2.664648733107291e-06, "loss": 1.0963, "step": 16420 }, { "epoch": 0.49, "learning_rate": 2.664405341848897e-06, "loss": 1.0835, "step": 16421 }, { "epoch": 0.49, "learning_rate": 2.664161949025444e-06, "loss": 1.1815, "step": 16422 }, { "epoch": 0.49, "learning_rate": 2.663918554639247e-06, "loss": 1.153, "step": 16423 }, { "epoch": 0.49, "learning_rate": 2.6636751586926255e-06, "loss": 1.1642, "step": 16424 }, { "epoch": 0.49, "learning_rate": 2.6634317611878945e-06, "loss": 1.2688, "step": 16425 }, { "epoch": 0.49, "learning_rate": 2.6631883621273723e-06, "loss": 1.1171, "step": 16426 }, { "epoch": 0.49, "learning_rate": 2.6629449615133755e-06, "loss": 1.1241, "step": 16427 }, { "epoch": 0.49, "learning_rate": 2.662701559348221e-06, "loss": 1.0867, "step": 16428 }, { "epoch": 0.49, "learning_rate": 2.6624581556342268e-06, "loss": 1.0283, "step": 16429 }, { "epoch": 0.49, "learning_rate": 2.662214750373708e-06, "loss": 1.1674, "step": 16430 }, { "epoch": 0.49, "learning_rate": 2.661971343568983e-06, "loss": 1.1182, "step": 16431 }, { "epoch": 0.5, "learning_rate": 2.6617279352223695e-06, "loss": 1.0688, "step": 16432 }, { "epoch": 0.5, "learning_rate": 2.661484525336183e-06, "loss": 1.0829, "step": 16433 }, { "epoch": 0.5, "learning_rate": 2.6612411139127424e-06, "loss": 1.0527, "step": 16434 }, { "epoch": 0.5, "learning_rate": 2.660997700954364e-06, "loss": 1.1825, "step": 16435 }, { "epoch": 0.5, "learning_rate": 2.660754286463365e-06, "loss": 1.1137, "step": 16436 }, { "epoch": 0.5, "learning_rate": 2.6605108704420627e-06, "loss": 1.176, "step": 16437 }, { "epoch": 0.5, "learning_rate": 2.6602674528927743e-06, "loss": 1.1696, "step": 16438 }, { "epoch": 0.5, "learning_rate": 2.6600240338178164e-06, "loss": 1.2024, "step": 16439 }, { "epoch": 0.5, "learning_rate": 2.659780613219507e-06, "loss": 1.16, "step": 16440 }, { "epoch": 0.5, "learning_rate": 2.6595371911001625e-06, "loss": 0.9632, "step": 16441 }, { "epoch": 0.5, "learning_rate": 2.6592937674621023e-06, "loss": 1.1301, "step": 16442 }, { "epoch": 0.5, "learning_rate": 2.659050342307641e-06, "loss": 0.9903, "step": 16443 }, { "epoch": 0.5, "learning_rate": 2.658806915639098e-06, "loss": 1.0276, "step": 16444 }, { "epoch": 0.5, "learning_rate": 2.6585634874587882e-06, "loss": 1.1776, "step": 16445 }, { "epoch": 0.5, "learning_rate": 2.658320057769031e-06, "loss": 1.1405, "step": 16446 }, { "epoch": 0.5, "learning_rate": 2.658076626572143e-06, "loss": 1.1509, "step": 16447 }, { "epoch": 0.5, "learning_rate": 2.657833193870442e-06, "loss": 1.0981, "step": 16448 }, { "epoch": 0.5, "learning_rate": 2.6575897596662448e-06, "loss": 1.162, "step": 16449 }, { "epoch": 0.5, "learning_rate": 2.65734632396187e-06, "loss": 1.0261, "step": 16450 }, { "epoch": 0.5, "learning_rate": 2.6571028867596327e-06, "loss": 0.9948, "step": 16451 }, { "epoch": 0.5, "learning_rate": 2.6568594480618514e-06, "loss": 1.1669, "step": 16452 }, { "epoch": 0.5, "learning_rate": 2.6566160078708446e-06, "loss": 1.0821, "step": 16453 }, { "epoch": 0.5, "learning_rate": 2.6563725661889285e-06, "loss": 1.2504, "step": 16454 }, { "epoch": 0.5, "learning_rate": 2.656129123018421e-06, "loss": 1.1358, "step": 16455 }, { "epoch": 0.5, "learning_rate": 2.655885678361639e-06, "loss": 1.1837, "step": 16456 }, { "epoch": 0.5, "learning_rate": 2.6556422322209006e-06, "loss": 1.2019, "step": 16457 }, { "epoch": 0.5, "learning_rate": 2.6553987845985235e-06, "loss": 1.0967, "step": 16458 }, { "epoch": 0.5, "learning_rate": 2.655155335496824e-06, "loss": 1.1907, "step": 16459 }, { "epoch": 0.5, "learning_rate": 2.654911884918121e-06, "loss": 1.2303, "step": 16460 }, { "epoch": 0.5, "learning_rate": 2.654668432864732e-06, "loss": 1.1834, "step": 16461 }, { "epoch": 0.5, "learning_rate": 2.6544249793389733e-06, "loss": 1.2109, "step": 16462 }, { "epoch": 0.5, "learning_rate": 2.6541815243431634e-06, "loss": 1.1489, "step": 16463 }, { "epoch": 0.5, "learning_rate": 2.6539380678796194e-06, "loss": 1.1683, "step": 16464 }, { "epoch": 0.5, "learning_rate": 2.653694609950659e-06, "loss": 1.096, "step": 16465 }, { "epoch": 0.5, "learning_rate": 2.6534511505586e-06, "loss": 1.109, "step": 16466 }, { "epoch": 0.5, "learning_rate": 2.6532076897057607e-06, "loss": 1.1473, "step": 16467 }, { "epoch": 0.5, "learning_rate": 2.652964227394458e-06, "loss": 1.0883, "step": 16468 }, { "epoch": 0.5, "learning_rate": 2.6527207636270086e-06, "loss": 1.1163, "step": 16469 }, { "epoch": 0.5, "learning_rate": 2.6524772984057318e-06, "loss": 1.0175, "step": 16470 }, { "epoch": 0.5, "learning_rate": 2.6522338317329438e-06, "loss": 1.1592, "step": 16471 }, { "epoch": 0.5, "learning_rate": 2.6519903636109632e-06, "loss": 1.1376, "step": 16472 }, { "epoch": 0.5, "learning_rate": 2.651746894042108e-06, "loss": 1.174, "step": 16473 }, { "epoch": 0.5, "learning_rate": 2.651503423028695e-06, "loss": 1.0832, "step": 16474 }, { "epoch": 0.5, "learning_rate": 2.6512599505730425e-06, "loss": 1.1268, "step": 16475 }, { "epoch": 0.5, "learning_rate": 2.6510164766774686e-06, "loss": 1.0908, "step": 16476 }, { "epoch": 0.5, "learning_rate": 2.65077300134429e-06, "loss": 1.1699, "step": 16477 }, { "epoch": 0.5, "learning_rate": 2.650529524575825e-06, "loss": 1.0605, "step": 16478 }, { "epoch": 0.5, "learning_rate": 2.6502860463743922e-06, "loss": 1.0557, "step": 16479 }, { "epoch": 0.5, "learning_rate": 2.650042566742308e-06, "loss": 1.1394, "step": 16480 }, { "epoch": 0.5, "learning_rate": 2.649799085681891e-06, "loss": 1.1137, "step": 16481 }, { "epoch": 0.5, "learning_rate": 2.6495556031954588e-06, "loss": 1.1036, "step": 16482 }, { "epoch": 0.5, "learning_rate": 2.649312119285329e-06, "loss": 1.118, "step": 16483 }, { "epoch": 0.5, "learning_rate": 2.6490686339538203e-06, "loss": 0.9872, "step": 16484 }, { "epoch": 0.5, "learning_rate": 2.64882514720325e-06, "loss": 1.0922, "step": 16485 }, { "epoch": 0.5, "learning_rate": 2.6485816590359354e-06, "loss": 1.1678, "step": 16486 }, { "epoch": 0.5, "learning_rate": 2.6483381694541947e-06, "loss": 1.1927, "step": 16487 }, { "epoch": 0.5, "learning_rate": 2.648094678460347e-06, "loss": 1.1893, "step": 16488 }, { "epoch": 0.5, "learning_rate": 2.647851186056709e-06, "loss": 1.0967, "step": 16489 }, { "epoch": 0.5, "learning_rate": 2.6476076922455983e-06, "loss": 1.1441, "step": 16490 }, { "epoch": 0.5, "learning_rate": 2.647364197029334e-06, "loss": 1.1124, "step": 16491 }, { "epoch": 0.5, "learning_rate": 2.647120700410234e-06, "loss": 1.1, "step": 16492 }, { "epoch": 0.5, "learning_rate": 2.646877202390615e-06, "loss": 1.1007, "step": 16493 }, { "epoch": 0.5, "learning_rate": 2.646633702972796e-06, "loss": 1.1766, "step": 16494 }, { "epoch": 0.5, "learning_rate": 2.646390202159095e-06, "loss": 1.0137, "step": 16495 }, { "epoch": 0.5, "learning_rate": 2.6461466999518296e-06, "loss": 1.0421, "step": 16496 }, { "epoch": 0.5, "learning_rate": 2.6459031963533183e-06, "loss": 1.1744, "step": 16497 }, { "epoch": 0.5, "learning_rate": 2.6456596913658788e-06, "loss": 1.1777, "step": 16498 }, { "epoch": 0.5, "learning_rate": 2.6454161849918285e-06, "loss": 1.3663, "step": 16499 }, { "epoch": 0.5, "learning_rate": 2.6451726772334863e-06, "loss": 1.1062, "step": 16500 }, { "epoch": 0.5, "learning_rate": 2.6449291680931705e-06, "loss": 1.1226, "step": 16501 }, { "epoch": 0.5, "learning_rate": 2.644685657573199e-06, "loss": 1.0723, "step": 16502 }, { "epoch": 0.5, "learning_rate": 2.644442145675889e-06, "loss": 1.2527, "step": 16503 }, { "epoch": 0.5, "learning_rate": 2.64419863240356e-06, "loss": 1.1442, "step": 16504 }, { "epoch": 0.5, "learning_rate": 2.643955117758529e-06, "loss": 1.1694, "step": 16505 }, { "epoch": 0.5, "learning_rate": 2.6437116017431154e-06, "loss": 1.1255, "step": 16506 }, { "epoch": 0.5, "learning_rate": 2.6434680843596362e-06, "loss": 0.9567, "step": 16507 }, { "epoch": 0.5, "learning_rate": 2.6432245656104092e-06, "loss": 0.9895, "step": 16508 }, { "epoch": 0.5, "learning_rate": 2.6429810454977544e-06, "loss": 1.1877, "step": 16509 }, { "epoch": 0.5, "learning_rate": 2.6427375240239883e-06, "loss": 1.129, "step": 16510 }, { "epoch": 0.5, "learning_rate": 2.64249400119143e-06, "loss": 1.1843, "step": 16511 }, { "epoch": 0.5, "learning_rate": 2.642250477002397e-06, "loss": 1.1679, "step": 16512 }, { "epoch": 0.5, "learning_rate": 2.6420069514592085e-06, "loss": 1.1343, "step": 16513 }, { "epoch": 0.5, "learning_rate": 2.641763424564182e-06, "loss": 1.0812, "step": 16514 }, { "epoch": 0.5, "learning_rate": 2.6415198963196353e-06, "loss": 1.0761, "step": 16515 }, { "epoch": 0.5, "learning_rate": 2.641276366727888e-06, "loss": 1.0593, "step": 16516 }, { "epoch": 0.5, "learning_rate": 2.641032835791258e-06, "loss": 1.1437, "step": 16517 }, { "epoch": 0.5, "learning_rate": 2.640789303512063e-06, "loss": 1.1514, "step": 16518 }, { "epoch": 0.5, "learning_rate": 2.6405457698926214e-06, "loss": 1.0845, "step": 16519 }, { "epoch": 0.5, "learning_rate": 2.640302234935252e-06, "loss": 1.1848, "step": 16520 }, { "epoch": 0.5, "learning_rate": 2.6400586986422727e-06, "loss": 1.1628, "step": 16521 }, { "epoch": 0.5, "learning_rate": 2.639815161016003e-06, "loss": 1.0733, "step": 16522 }, { "epoch": 0.5, "learning_rate": 2.639571622058759e-06, "loss": 1.1058, "step": 16523 }, { "epoch": 0.5, "learning_rate": 2.6393280817728612e-06, "loss": 0.9875, "step": 16524 }, { "epoch": 0.5, "learning_rate": 2.6390845401606268e-06, "loss": 1.252, "step": 16525 }, { "epoch": 0.5, "learning_rate": 2.6388409972243752e-06, "loss": 1.1385, "step": 16526 }, { "epoch": 0.5, "learning_rate": 2.638597452966423e-06, "loss": 1.0741, "step": 16527 }, { "epoch": 0.5, "learning_rate": 2.6383539073890907e-06, "loss": 1.0649, "step": 16528 }, { "epoch": 0.5, "learning_rate": 2.638110360494695e-06, "loss": 1.0828, "step": 16529 }, { "epoch": 0.5, "learning_rate": 2.637866812285556e-06, "loss": 1.0912, "step": 16530 }, { "epoch": 0.5, "learning_rate": 2.637623262763991e-06, "loss": 1.0361, "step": 16531 }, { "epoch": 0.5, "learning_rate": 2.6373797119323187e-06, "loss": 1.0995, "step": 16532 }, { "epoch": 0.5, "learning_rate": 2.6371361597928585e-06, "loss": 1.1426, "step": 16533 }, { "epoch": 0.5, "learning_rate": 2.636892606347927e-06, "loss": 1.1117, "step": 16534 }, { "epoch": 0.5, "learning_rate": 2.636649051599845e-06, "loss": 1.1412, "step": 16535 }, { "epoch": 0.5, "learning_rate": 2.636405495550929e-06, "loss": 1.2289, "step": 16536 }, { "epoch": 0.5, "learning_rate": 2.6361619382034985e-06, "loss": 1.1517, "step": 16537 }, { "epoch": 0.5, "learning_rate": 2.635918379559872e-06, "loss": 1.239, "step": 16538 }, { "epoch": 0.5, "learning_rate": 2.6356748196223687e-06, "loss": 1.0403, "step": 16539 }, { "epoch": 0.5, "learning_rate": 2.6354312583933052e-06, "loss": 1.0519, "step": 16540 }, { "epoch": 0.5, "learning_rate": 2.6351876958750017e-06, "loss": 1.154, "step": 16541 }, { "epoch": 0.5, "learning_rate": 2.6349441320697764e-06, "loss": 1.1201, "step": 16542 }, { "epoch": 0.5, "learning_rate": 2.6347005669799486e-06, "loss": 1.18, "step": 16543 }, { "epoch": 0.5, "learning_rate": 2.6344570006078357e-06, "loss": 1.1465, "step": 16544 }, { "epoch": 0.5, "learning_rate": 2.6342134329557565e-06, "loss": 1.079, "step": 16545 }, { "epoch": 0.5, "learning_rate": 2.6339698640260315e-06, "loss": 1.1329, "step": 16546 }, { "epoch": 0.5, "learning_rate": 2.6337262938209764e-06, "loss": 1.1494, "step": 16547 }, { "epoch": 0.5, "learning_rate": 2.633482722342913e-06, "loss": 1.2474, "step": 16548 }, { "epoch": 0.5, "learning_rate": 2.633239149594157e-06, "loss": 1.095, "step": 16549 }, { "epoch": 0.5, "learning_rate": 2.6329955755770287e-06, "loss": 1.1317, "step": 16550 }, { "epoch": 0.5, "learning_rate": 2.6327520002938467e-06, "loss": 1.1766, "step": 16551 }, { "epoch": 0.5, "learning_rate": 2.63250842374693e-06, "loss": 1.0091, "step": 16552 }, { "epoch": 0.5, "learning_rate": 2.6322648459385964e-06, "loss": 1.146, "step": 16553 }, { "epoch": 0.5, "learning_rate": 2.6320212668711647e-06, "loss": 1.1421, "step": 16554 }, { "epoch": 0.5, "learning_rate": 2.6317776865469547e-06, "loss": 1.1824, "step": 16555 }, { "epoch": 0.5, "learning_rate": 2.631534104968285e-06, "loss": 1.1598, "step": 16556 }, { "epoch": 0.5, "learning_rate": 2.6312905221374737e-06, "loss": 1.0858, "step": 16557 }, { "epoch": 0.5, "learning_rate": 2.6310469380568394e-06, "loss": 1.1255, "step": 16558 }, { "epoch": 0.5, "learning_rate": 2.6308033527287018e-06, "loss": 1.1255, "step": 16559 }, { "epoch": 0.5, "learning_rate": 2.6305597661553795e-06, "loss": 1.1444, "step": 16560 }, { "epoch": 0.5, "learning_rate": 2.6303161783391906e-06, "loss": 1.14, "step": 16561 }, { "epoch": 0.5, "learning_rate": 2.6300725892824546e-06, "loss": 1.0586, "step": 16562 }, { "epoch": 0.5, "learning_rate": 2.629828998987491e-06, "loss": 0.9861, "step": 16563 }, { "epoch": 0.5, "learning_rate": 2.6295854074566167e-06, "loss": 1.086, "step": 16564 }, { "epoch": 0.5, "learning_rate": 2.6293418146921524e-06, "loss": 1.1586, "step": 16565 }, { "epoch": 0.5, "learning_rate": 2.629098220696416e-06, "loss": 1.0521, "step": 16566 }, { "epoch": 0.5, "learning_rate": 2.6288546254717266e-06, "loss": 1.1453, "step": 16567 }, { "epoch": 0.5, "learning_rate": 2.6286110290204035e-06, "loss": 1.2411, "step": 16568 }, { "epoch": 0.5, "learning_rate": 2.628367431344765e-06, "loss": 1.2621, "step": 16569 }, { "epoch": 0.5, "learning_rate": 2.6281238324471304e-06, "loss": 1.196, "step": 16570 }, { "epoch": 0.5, "learning_rate": 2.6278802323298187e-06, "loss": 1.0553, "step": 16571 }, { "epoch": 0.5, "learning_rate": 2.6276366309951495e-06, "loss": 1.1459, "step": 16572 }, { "epoch": 0.5, "learning_rate": 2.6273930284454404e-06, "loss": 1.2091, "step": 16573 }, { "epoch": 0.5, "learning_rate": 2.627149424683011e-06, "loss": 1.1449, "step": 16574 }, { "epoch": 0.5, "learning_rate": 2.6269058197101806e-06, "loss": 1.1021, "step": 16575 }, { "epoch": 0.5, "learning_rate": 2.626662213529268e-06, "loss": 1.133, "step": 16576 }, { "epoch": 0.5, "learning_rate": 2.626418606142591e-06, "loss": 1.1454, "step": 16577 }, { "epoch": 0.5, "learning_rate": 2.6261749975524715e-06, "loss": 1.0692, "step": 16578 }, { "epoch": 0.5, "learning_rate": 2.6259313877612257e-06, "loss": 1.0551, "step": 16579 }, { "epoch": 0.5, "learning_rate": 2.625687776771174e-06, "loss": 1.1087, "step": 16580 }, { "epoch": 0.5, "learning_rate": 2.6254441645846353e-06, "loss": 1.1472, "step": 16581 }, { "epoch": 0.5, "learning_rate": 2.625200551203928e-06, "loss": 1.0444, "step": 16582 }, { "epoch": 0.5, "learning_rate": 2.624956936631372e-06, "loss": 1.0944, "step": 16583 }, { "epoch": 0.5, "learning_rate": 2.624713320869286e-06, "loss": 1.1906, "step": 16584 }, { "epoch": 0.5, "learning_rate": 2.6244697039199895e-06, "loss": 1.0756, "step": 16585 }, { "epoch": 0.5, "learning_rate": 2.6242260857858017e-06, "loss": 1.2603, "step": 16586 }, { "epoch": 0.5, "learning_rate": 2.623982466469041e-06, "loss": 1.0677, "step": 16587 }, { "epoch": 0.5, "learning_rate": 2.623738845972027e-06, "loss": 1.0778, "step": 16588 }, { "epoch": 0.5, "learning_rate": 2.623495224297079e-06, "loss": 1.1273, "step": 16589 }, { "epoch": 0.5, "learning_rate": 2.623251601446516e-06, "loss": 1.0131, "step": 16590 }, { "epoch": 0.5, "learning_rate": 2.623007977422657e-06, "loss": 1.1219, "step": 16591 }, { "epoch": 0.5, "learning_rate": 2.6227643522278213e-06, "loss": 1.1732, "step": 16592 }, { "epoch": 0.5, "learning_rate": 2.622520725864328e-06, "loss": 1.229, "step": 16593 }, { "epoch": 0.5, "learning_rate": 2.6222770983344963e-06, "loss": 1.0087, "step": 16594 }, { "epoch": 0.5, "learning_rate": 2.622033469640645e-06, "loss": 1.0571, "step": 16595 }, { "epoch": 0.5, "learning_rate": 2.6217898397850942e-06, "loss": 1.14, "step": 16596 }, { "epoch": 0.5, "learning_rate": 2.6215462087701636e-06, "loss": 1.1188, "step": 16597 }, { "epoch": 0.5, "learning_rate": 2.621302576598171e-06, "loss": 1.1362, "step": 16598 }, { "epoch": 0.5, "learning_rate": 2.621058943271436e-06, "loss": 1.1239, "step": 16599 }, { "epoch": 0.5, "learning_rate": 2.620815308792279e-06, "loss": 1.0438, "step": 16600 }, { "epoch": 0.5, "learning_rate": 2.620571673163018e-06, "loss": 1.2146, "step": 16601 }, { "epoch": 0.5, "learning_rate": 2.6203280363859724e-06, "loss": 1.2043, "step": 16602 }, { "epoch": 0.5, "learning_rate": 2.620084398463462e-06, "loss": 1.2311, "step": 16603 }, { "epoch": 0.5, "learning_rate": 2.6198407593978065e-06, "loss": 1.0746, "step": 16604 }, { "epoch": 0.5, "learning_rate": 2.6195971191913237e-06, "loss": 1.098, "step": 16605 }, { "epoch": 0.5, "learning_rate": 2.6193534778463354e-06, "loss": 1.116, "step": 16606 }, { "epoch": 0.5, "learning_rate": 2.619109835365158e-06, "loss": 1.1925, "step": 16607 }, { "epoch": 0.5, "learning_rate": 2.6188661917501136e-06, "loss": 1.0834, "step": 16608 }, { "epoch": 0.5, "learning_rate": 2.6186225470035194e-06, "loss": 1.0485, "step": 16609 }, { "epoch": 0.5, "learning_rate": 2.6183789011276955e-06, "loss": 1.1027, "step": 16610 }, { "epoch": 0.5, "learning_rate": 2.6181352541249617e-06, "loss": 1.1917, "step": 16611 }, { "epoch": 0.5, "learning_rate": 2.6178916059976374e-06, "loss": 1.082, "step": 16612 }, { "epoch": 0.5, "learning_rate": 2.617647956748042e-06, "loss": 1.2108, "step": 16613 }, { "epoch": 0.5, "learning_rate": 2.6174043063784936e-06, "loss": 1.0815, "step": 16614 }, { "epoch": 0.5, "learning_rate": 2.617160654891314e-06, "loss": 1.183, "step": 16615 }, { "epoch": 0.5, "learning_rate": 2.616917002288821e-06, "loss": 1.1263, "step": 16616 }, { "epoch": 0.5, "learning_rate": 2.6166733485733348e-06, "loss": 1.1918, "step": 16617 }, { "epoch": 0.5, "learning_rate": 2.6164296937471738e-06, "loss": 1.2331, "step": 16618 }, { "epoch": 0.5, "learning_rate": 2.616186037812659e-06, "loss": 1.0633, "step": 16619 }, { "epoch": 0.5, "learning_rate": 2.6159423807721085e-06, "loss": 1.0718, "step": 16620 }, { "epoch": 0.5, "learning_rate": 2.615698722627843e-06, "loss": 1.0929, "step": 16621 }, { "epoch": 0.5, "learning_rate": 2.6154550633821803e-06, "loss": 1.0201, "step": 16622 }, { "epoch": 0.5, "learning_rate": 2.6152114030374413e-06, "loss": 1.154, "step": 16623 }, { "epoch": 0.5, "learning_rate": 2.614967741595945e-06, "loss": 1.2108, "step": 16624 }, { "epoch": 0.5, "learning_rate": 2.614724079060012e-06, "loss": 1.0533, "step": 16625 }, { "epoch": 0.5, "learning_rate": 2.614480415431961e-06, "loss": 1.1174, "step": 16626 }, { "epoch": 0.5, "learning_rate": 2.614236750714111e-06, "loss": 1.1929, "step": 16627 }, { "epoch": 0.5, "learning_rate": 2.6139930849087823e-06, "loss": 1.14, "step": 16628 }, { "epoch": 0.5, "learning_rate": 2.613749418018295e-06, "loss": 1.112, "step": 16629 }, { "epoch": 0.5, "learning_rate": 2.6135057500449672e-06, "loss": 1.2023, "step": 16630 }, { "epoch": 0.5, "learning_rate": 2.6132620809911197e-06, "loss": 1.1484, "step": 16631 }, { "epoch": 0.5, "learning_rate": 2.6130184108590717e-06, "loss": 1.2401, "step": 16632 }, { "epoch": 0.5, "learning_rate": 2.6127747396511428e-06, "loss": 1.1431, "step": 16633 }, { "epoch": 0.5, "learning_rate": 2.612531067369653e-06, "loss": 1.0347, "step": 16634 }, { "epoch": 0.5, "learning_rate": 2.6122873940169214e-06, "loss": 1.0856, "step": 16635 }, { "epoch": 0.5, "learning_rate": 2.6120437195952677e-06, "loss": 1.1741, "step": 16636 }, { "epoch": 0.5, "learning_rate": 2.6118000441070115e-06, "loss": 1.2667, "step": 16637 }, { "epoch": 0.5, "learning_rate": 2.611556367554473e-06, "loss": 1.1116, "step": 16638 }, { "epoch": 0.5, "learning_rate": 2.6113126899399716e-06, "loss": 1.2153, "step": 16639 }, { "epoch": 0.5, "learning_rate": 2.611069011265827e-06, "loss": 1.0347, "step": 16640 }, { "epoch": 0.5, "learning_rate": 2.6108253315343598e-06, "loss": 1.1227, "step": 16641 }, { "epoch": 0.5, "learning_rate": 2.6105816507478875e-06, "loss": 1.0068, "step": 16642 }, { "epoch": 0.5, "learning_rate": 2.610337968908732e-06, "loss": 1.2175, "step": 16643 }, { "epoch": 0.5, "learning_rate": 2.610094286019211e-06, "loss": 1.1491, "step": 16644 }, { "epoch": 0.5, "learning_rate": 2.609850602081647e-06, "loss": 1.1605, "step": 16645 }, { "epoch": 0.5, "learning_rate": 2.6096069170983574e-06, "loss": 1.1201, "step": 16646 }, { "epoch": 0.5, "learning_rate": 2.6093632310716633e-06, "loss": 1.07, "step": 16647 }, { "epoch": 0.5, "learning_rate": 2.609119544003883e-06, "loss": 1.1543, "step": 16648 }, { "epoch": 0.5, "learning_rate": 2.608875855897338e-06, "loss": 1.217, "step": 16649 }, { "epoch": 0.5, "learning_rate": 2.6086321667543467e-06, "loss": 1.1596, "step": 16650 }, { "epoch": 0.5, "learning_rate": 2.6083884765772292e-06, "loss": 1.1191, "step": 16651 }, { "epoch": 0.5, "learning_rate": 2.6081447853683062e-06, "loss": 1.1636, "step": 16652 }, { "epoch": 0.5, "learning_rate": 2.6079010931298964e-06, "loss": 1.1028, "step": 16653 }, { "epoch": 0.5, "learning_rate": 2.607657399864321e-06, "loss": 1.0754, "step": 16654 }, { "epoch": 0.5, "learning_rate": 2.6074137055738986e-06, "loss": 1.1182, "step": 16655 }, { "epoch": 0.5, "learning_rate": 2.6071700102609493e-06, "loss": 1.2564, "step": 16656 }, { "epoch": 0.5, "learning_rate": 2.6069263139277933e-06, "loss": 1.0811, "step": 16657 }, { "epoch": 0.5, "learning_rate": 2.6066826165767507e-06, "loss": 1.0853, "step": 16658 }, { "epoch": 0.5, "learning_rate": 2.60643891821014e-06, "loss": 1.1833, "step": 16659 }, { "epoch": 0.5, "learning_rate": 2.6061952188302832e-06, "loss": 1.1301, "step": 16660 }, { "epoch": 0.5, "learning_rate": 2.605951518439498e-06, "loss": 1.2018, "step": 16661 }, { "epoch": 0.5, "learning_rate": 2.6057078170401063e-06, "loss": 1.1253, "step": 16662 }, { "epoch": 0.5, "learning_rate": 2.6054641146344263e-06, "loss": 1.0452, "step": 16663 }, { "epoch": 0.5, "learning_rate": 2.6052204112247785e-06, "loss": 1.0859, "step": 16664 }, { "epoch": 0.5, "learning_rate": 2.6049767068134833e-06, "loss": 1.1172, "step": 16665 }, { "epoch": 0.5, "learning_rate": 2.6047330014028603e-06, "loss": 1.1082, "step": 16666 }, { "epoch": 0.5, "learning_rate": 2.6044892949952304e-06, "loss": 1.075, "step": 16667 }, { "epoch": 0.5, "learning_rate": 2.6042455875929123e-06, "loss": 1.1638, "step": 16668 }, { "epoch": 0.5, "learning_rate": 2.604001879198227e-06, "loss": 1.2184, "step": 16669 }, { "epoch": 0.5, "learning_rate": 2.6037581698134927e-06, "loss": 1.1907, "step": 16670 }, { "epoch": 0.5, "learning_rate": 2.6035144594410316e-06, "loss": 1.1401, "step": 16671 }, { "epoch": 0.5, "learning_rate": 2.603270748083162e-06, "loss": 1.0405, "step": 16672 }, { "epoch": 0.5, "learning_rate": 2.6030270357422057e-06, "loss": 1.1776, "step": 16673 }, { "epoch": 0.5, "learning_rate": 2.60278332242048e-06, "loss": 1.1821, "step": 16674 }, { "epoch": 0.5, "learning_rate": 2.602539608120308e-06, "loss": 1.2385, "step": 16675 }, { "epoch": 0.5, "learning_rate": 2.6022958928440073e-06, "loss": 1.1855, "step": 16676 }, { "epoch": 0.5, "learning_rate": 2.6020521765938995e-06, "loss": 1.0399, "step": 16677 }, { "epoch": 0.5, "learning_rate": 2.6018084593723037e-06, "loss": 1.0009, "step": 16678 }, { "epoch": 0.5, "learning_rate": 2.601564741181541e-06, "loss": 1.1275, "step": 16679 }, { "epoch": 0.5, "learning_rate": 2.6013210220239306e-06, "loss": 1.1846, "step": 16680 }, { "epoch": 0.5, "learning_rate": 2.6010773019017925e-06, "loss": 1.2061, "step": 16681 }, { "epoch": 0.5, "learning_rate": 2.6008335808174478e-06, "loss": 0.9975, "step": 16682 }, { "epoch": 0.5, "learning_rate": 2.6005898587732157e-06, "loss": 1.2238, "step": 16683 }, { "epoch": 0.5, "learning_rate": 2.600346135771417e-06, "loss": 1.1369, "step": 16684 }, { "epoch": 0.5, "learning_rate": 2.6001024118143708e-06, "loss": 1.2011, "step": 16685 }, { "epoch": 0.5, "learning_rate": 2.5998586869043984e-06, "loss": 1.2015, "step": 16686 }, { "epoch": 0.5, "learning_rate": 2.5996149610438187e-06, "loss": 1.1436, "step": 16687 }, { "epoch": 0.5, "learning_rate": 2.599371234234953e-06, "loss": 1.1035, "step": 16688 }, { "epoch": 0.5, "learning_rate": 2.599127506480121e-06, "loss": 1.0574, "step": 16689 }, { "epoch": 0.5, "learning_rate": 2.5988837777816434e-06, "loss": 1.0038, "step": 16690 }, { "epoch": 0.5, "learning_rate": 2.598640048141839e-06, "loss": 1.0719, "step": 16691 }, { "epoch": 0.5, "learning_rate": 2.598396317563029e-06, "loss": 1.1042, "step": 16692 }, { "epoch": 0.5, "learning_rate": 2.598152586047533e-06, "loss": 1.1343, "step": 16693 }, { "epoch": 0.5, "learning_rate": 2.597908853597672e-06, "loss": 0.9987, "step": 16694 }, { "epoch": 0.5, "learning_rate": 2.5976651202157666e-06, "loss": 1.1093, "step": 16695 }, { "epoch": 0.5, "learning_rate": 2.597421385904135e-06, "loss": 1.0887, "step": 16696 }, { "epoch": 0.5, "learning_rate": 2.5971776506651003e-06, "loss": 1.0652, "step": 16697 }, { "epoch": 0.5, "learning_rate": 2.5969339145009802e-06, "loss": 1.206, "step": 16698 }, { "epoch": 0.5, "learning_rate": 2.596690177414096e-06, "loss": 1.1052, "step": 16699 }, { "epoch": 0.5, "learning_rate": 2.596446439406768e-06, "loss": 1.1631, "step": 16700 }, { "epoch": 0.5, "learning_rate": 2.5962027004813166e-06, "loss": 1.1467, "step": 16701 }, { "epoch": 0.5, "learning_rate": 2.5959589606400613e-06, "loss": 1.1895, "step": 16702 }, { "epoch": 0.5, "learning_rate": 2.5957152198853237e-06, "loss": 1.0811, "step": 16703 }, { "epoch": 0.5, "learning_rate": 2.5954714782194222e-06, "loss": 1.245, "step": 16704 }, { "epoch": 0.5, "learning_rate": 2.5952277356446785e-06, "loss": 1.1161, "step": 16705 }, { "epoch": 0.5, "learning_rate": 2.594983992163413e-06, "loss": 1.238, "step": 16706 }, { "epoch": 0.5, "learning_rate": 2.5947402477779454e-06, "loss": 1.1978, "step": 16707 }, { "epoch": 0.5, "learning_rate": 2.5944965024905965e-06, "loss": 1.1307, "step": 16708 }, { "epoch": 0.5, "learning_rate": 2.5942527563036863e-06, "loss": 1.1084, "step": 16709 }, { "epoch": 0.5, "learning_rate": 2.5940090092195353e-06, "loss": 1.1315, "step": 16710 }, { "epoch": 0.5, "learning_rate": 2.5937652612404635e-06, "loss": 1.1394, "step": 16711 }, { "epoch": 0.5, "learning_rate": 2.593521512368792e-06, "loss": 1.0763, "step": 16712 }, { "epoch": 0.5, "learning_rate": 2.5932777626068405e-06, "loss": 1.1769, "step": 16713 }, { "epoch": 0.5, "learning_rate": 2.59303401195693e-06, "loss": 1.1337, "step": 16714 }, { "epoch": 0.5, "learning_rate": 2.59279026042138e-06, "loss": 1.0856, "step": 16715 }, { "epoch": 0.5, "learning_rate": 2.5925465080025118e-06, "loss": 1.1179, "step": 16716 }, { "epoch": 0.5, "learning_rate": 2.5923027547026454e-06, "loss": 1.157, "step": 16717 }, { "epoch": 0.5, "learning_rate": 2.592059000524101e-06, "loss": 1.2821, "step": 16718 }, { "epoch": 0.5, "learning_rate": 2.591815245469199e-06, "loss": 1.1807, "step": 16719 }, { "epoch": 0.5, "learning_rate": 2.5915714895402606e-06, "loss": 1.0963, "step": 16720 }, { "epoch": 0.5, "learning_rate": 2.5913277327396053e-06, "loss": 1.1583, "step": 16721 }, { "epoch": 0.5, "learning_rate": 2.5910839750695537e-06, "loss": 1.2213, "step": 16722 }, { "epoch": 0.5, "learning_rate": 2.5908402165324276e-06, "loss": 1.212, "step": 16723 }, { "epoch": 0.5, "learning_rate": 2.590596457130546e-06, "loss": 1.1345, "step": 16724 }, { "epoch": 0.5, "learning_rate": 2.5903526968662294e-06, "loss": 1.2047, "step": 16725 }, { "epoch": 0.5, "learning_rate": 2.5901089357417987e-06, "loss": 1.0348, "step": 16726 }, { "epoch": 0.5, "learning_rate": 2.589865173759575e-06, "loss": 1.1439, "step": 16727 }, { "epoch": 0.5, "learning_rate": 2.589621410921877e-06, "loss": 1.057, "step": 16728 }, { "epoch": 0.5, "learning_rate": 2.5893776472310274e-06, "loss": 1.1127, "step": 16729 }, { "epoch": 0.5, "learning_rate": 2.589133882689345e-06, "loss": 1.0104, "step": 16730 }, { "epoch": 0.5, "learning_rate": 2.588890117299151e-06, "loss": 1.267, "step": 16731 }, { "epoch": 0.5, "learning_rate": 2.588646351062766e-06, "loss": 1.1302, "step": 16732 }, { "epoch": 0.5, "learning_rate": 2.5884025839825106e-06, "loss": 1.1801, "step": 16733 }, { "epoch": 0.5, "learning_rate": 2.5881588160607045e-06, "loss": 1.0269, "step": 16734 }, { "epoch": 0.5, "learning_rate": 2.5879150472996695e-06, "loss": 1.1744, "step": 16735 }, { "epoch": 0.5, "learning_rate": 2.5876712777017254e-06, "loss": 1.1754, "step": 16736 }, { "epoch": 0.5, "learning_rate": 2.587427507269193e-06, "loss": 1.1991, "step": 16737 }, { "epoch": 0.5, "learning_rate": 2.5871837360043934e-06, "loss": 1.2144, "step": 16738 }, { "epoch": 0.5, "learning_rate": 2.586939963909646e-06, "loss": 1.1179, "step": 16739 }, { "epoch": 0.5, "learning_rate": 2.5866961909872725e-06, "loss": 1.0918, "step": 16740 }, { "epoch": 0.5, "learning_rate": 2.5864524172395924e-06, "loss": 1.0362, "step": 16741 }, { "epoch": 0.5, "learning_rate": 2.5862086426689275e-06, "loss": 1.1778, "step": 16742 }, { "epoch": 0.5, "learning_rate": 2.5859648672775973e-06, "loss": 1.1042, "step": 16743 }, { "epoch": 0.5, "learning_rate": 2.585721091067923e-06, "loss": 1.2343, "step": 16744 }, { "epoch": 0.5, "learning_rate": 2.5854773140422256e-06, "loss": 1.1088, "step": 16745 }, { "epoch": 0.5, "learning_rate": 2.5852335362028254e-06, "loss": 1.1133, "step": 16746 }, { "epoch": 0.5, "learning_rate": 2.584989757552042e-06, "loss": 1.1143, "step": 16747 }, { "epoch": 0.5, "learning_rate": 2.584745978092198e-06, "loss": 1.0395, "step": 16748 }, { "epoch": 0.5, "learning_rate": 2.584502197825613e-06, "loss": 1.1476, "step": 16749 }, { "epoch": 0.5, "learning_rate": 2.5842584167546076e-06, "loss": 1.1534, "step": 16750 }, { "epoch": 0.5, "learning_rate": 2.5840146348815026e-06, "loss": 1.164, "step": 16751 }, { "epoch": 0.5, "learning_rate": 2.5837708522086186e-06, "loss": 1.0822, "step": 16752 }, { "epoch": 0.5, "learning_rate": 2.5835270687382776e-06, "loss": 1.2137, "step": 16753 }, { "epoch": 0.5, "learning_rate": 2.583283284472798e-06, "loss": 1.0349, "step": 16754 }, { "epoch": 0.5, "learning_rate": 2.583039499414502e-06, "loss": 1.0617, "step": 16755 }, { "epoch": 0.5, "learning_rate": 2.5827957135657093e-06, "loss": 1.1553, "step": 16756 }, { "epoch": 0.5, "learning_rate": 2.582551926928742e-06, "loss": 1.0775, "step": 16757 }, { "epoch": 0.5, "learning_rate": 2.5823081395059203e-06, "loss": 1.2025, "step": 16758 }, { "epoch": 0.5, "learning_rate": 2.5820643512995636e-06, "loss": 1.1393, "step": 16759 }, { "epoch": 0.5, "learning_rate": 2.5818205623119947e-06, "loss": 1.113, "step": 16760 }, { "epoch": 0.5, "learning_rate": 2.5815767725455333e-06, "loss": 1.3136, "step": 16761 }, { "epoch": 0.5, "learning_rate": 2.5813329820025e-06, "loss": 1.1371, "step": 16762 }, { "epoch": 0.5, "learning_rate": 2.5810891906852163e-06, "loss": 0.9639, "step": 16763 }, { "epoch": 0.51, "learning_rate": 2.5808453985960025e-06, "loss": 1.2301, "step": 16764 }, { "epoch": 0.51, "learning_rate": 2.5806016057371797e-06, "loss": 1.1335, "step": 16765 }, { "epoch": 0.51, "learning_rate": 2.580357812111068e-06, "loss": 0.9995, "step": 16766 }, { "epoch": 0.51, "learning_rate": 2.5801140177199886e-06, "loss": 1.0784, "step": 16767 }, { "epoch": 0.51, "learning_rate": 2.579870222566263e-06, "loss": 1.1646, "step": 16768 }, { "epoch": 0.51, "learning_rate": 2.579626426652211e-06, "loss": 1.17, "step": 16769 }, { "epoch": 0.51, "learning_rate": 2.579382629980153e-06, "loss": 1.1572, "step": 16770 }, { "epoch": 0.51, "learning_rate": 2.5791388325524114e-06, "loss": 1.1202, "step": 16771 }, { "epoch": 0.51, "learning_rate": 2.5788950343713058e-06, "loss": 1.1255, "step": 16772 }, { "epoch": 0.51, "learning_rate": 2.5786512354391584e-06, "loss": 1.1921, "step": 16773 }, { "epoch": 0.51, "learning_rate": 2.578407435758288e-06, "loss": 1.1093, "step": 16774 }, { "epoch": 0.51, "learning_rate": 2.5781636353310167e-06, "loss": 1.0077, "step": 16775 }, { "epoch": 0.51, "learning_rate": 2.577919834159666e-06, "loss": 1.0513, "step": 16776 }, { "epoch": 0.51, "learning_rate": 2.5776760322465554e-06, "loss": 1.1013, "step": 16777 }, { "epoch": 0.51, "learning_rate": 2.5774322295940064e-06, "loss": 1.1082, "step": 16778 }, { "epoch": 0.51, "learning_rate": 2.57718842620434e-06, "loss": 1.2587, "step": 16779 }, { "epoch": 0.51, "learning_rate": 2.576944622079877e-06, "loss": 1.1735, "step": 16780 }, { "epoch": 0.51, "learning_rate": 2.5767008172229384e-06, "loss": 1.1837, "step": 16781 }, { "epoch": 0.51, "learning_rate": 2.5764570116358446e-06, "loss": 1.1198, "step": 16782 }, { "epoch": 0.51, "learning_rate": 2.576213205320918e-06, "loss": 1.1951, "step": 16783 }, { "epoch": 0.51, "learning_rate": 2.575969398280477e-06, "loss": 1.0488, "step": 16784 }, { "epoch": 0.51, "learning_rate": 2.575725590516844e-06, "loss": 1.2521, "step": 16785 }, { "epoch": 0.51, "learning_rate": 2.57548178203234e-06, "loss": 1.1577, "step": 16786 }, { "epoch": 0.51, "learning_rate": 2.575237972829286e-06, "loss": 1.1749, "step": 16787 }, { "epoch": 0.51, "learning_rate": 2.5749941629100028e-06, "loss": 1.0553, "step": 16788 }, { "epoch": 0.51, "learning_rate": 2.574750352276811e-06, "loss": 1.036, "step": 16789 }, { "epoch": 0.51, "learning_rate": 2.5745065409320324e-06, "loss": 1.1171, "step": 16790 }, { "epoch": 0.51, "learning_rate": 2.5742627288779865e-06, "loss": 1.1718, "step": 16791 }, { "epoch": 0.51, "learning_rate": 2.5740189161169967e-06, "loss": 1.1383, "step": 16792 }, { "epoch": 0.51, "learning_rate": 2.5737751026513805e-06, "loss": 1.1277, "step": 16793 }, { "epoch": 0.51, "learning_rate": 2.5735312884834623e-06, "loss": 1.1516, "step": 16794 }, { "epoch": 0.51, "learning_rate": 2.573287473615561e-06, "loss": 1.0837, "step": 16795 }, { "epoch": 0.51, "learning_rate": 2.573043658049999e-06, "loss": 1.0162, "step": 16796 }, { "epoch": 0.51, "learning_rate": 2.572799841789096e-06, "loss": 1.2064, "step": 16797 }, { "epoch": 0.51, "learning_rate": 2.5725560248351735e-06, "loss": 1.2227, "step": 16798 }, { "epoch": 0.51, "learning_rate": 2.5723122071905526e-06, "loss": 1.2068, "step": 16799 }, { "epoch": 0.51, "learning_rate": 2.5720683888575544e-06, "loss": 0.9722, "step": 16800 }, { "epoch": 0.51, "learning_rate": 2.5718245698384997e-06, "loss": 1.1746, "step": 16801 }, { "epoch": 0.51, "learning_rate": 2.57158075013571e-06, "loss": 1.1303, "step": 16802 }, { "epoch": 0.51, "learning_rate": 2.5713369297515057e-06, "loss": 1.1706, "step": 16803 }, { "epoch": 0.51, "learning_rate": 2.5710931086882077e-06, "loss": 1.201, "step": 16804 }, { "epoch": 0.51, "learning_rate": 2.570849286948139e-06, "loss": 1.2168, "step": 16805 }, { "epoch": 0.51, "learning_rate": 2.570605464533618e-06, "loss": 1.0879, "step": 16806 }, { "epoch": 0.51, "learning_rate": 2.570361641446968e-06, "loss": 1.1945, "step": 16807 }, { "epoch": 0.51, "learning_rate": 2.5701178176905084e-06, "loss": 1.0551, "step": 16808 }, { "epoch": 0.51, "learning_rate": 2.569873993266561e-06, "loss": 1.1772, "step": 16809 }, { "epoch": 0.51, "learning_rate": 2.5696301681774467e-06, "loss": 1.059, "step": 16810 }, { "epoch": 0.51, "learning_rate": 2.569386342425487e-06, "loss": 1.2003, "step": 16811 }, { "epoch": 0.51, "learning_rate": 2.5691425160130025e-06, "loss": 1.0834, "step": 16812 }, { "epoch": 0.51, "learning_rate": 2.5688986889423144e-06, "loss": 1.1256, "step": 16813 }, { "epoch": 0.51, "learning_rate": 2.5686548612157445e-06, "loss": 1.1407, "step": 16814 }, { "epoch": 0.51, "learning_rate": 2.5684110328356133e-06, "loss": 1.0648, "step": 16815 }, { "epoch": 0.51, "learning_rate": 2.5681672038042417e-06, "loss": 1.1103, "step": 16816 }, { "epoch": 0.51, "learning_rate": 2.5679233741239505e-06, "loss": 1.1175, "step": 16817 }, { "epoch": 0.51, "learning_rate": 2.567679543797063e-06, "loss": 1.1467, "step": 16818 }, { "epoch": 0.51, "learning_rate": 2.5674357128258975e-06, "loss": 1.1351, "step": 16819 }, { "epoch": 0.51, "learning_rate": 2.567191881212778e-06, "loss": 1.176, "step": 16820 }, { "epoch": 0.51, "learning_rate": 2.566948048960023e-06, "loss": 1.0549, "step": 16821 }, { "epoch": 0.51, "learning_rate": 2.566704216069955e-06, "loss": 1.0185, "step": 16822 }, { "epoch": 0.51, "learning_rate": 2.5664603825448946e-06, "loss": 1.1284, "step": 16823 }, { "epoch": 0.51, "learning_rate": 2.566216548387164e-06, "loss": 1.1334, "step": 16824 }, { "epoch": 0.51, "learning_rate": 2.5659727135990836e-06, "loss": 1.0963, "step": 16825 }, { "epoch": 0.51, "learning_rate": 2.565728878182975e-06, "loss": 1.0482, "step": 16826 }, { "epoch": 0.51, "learning_rate": 2.565485042141159e-06, "loss": 1.0534, "step": 16827 }, { "epoch": 0.51, "learning_rate": 2.565241205475956e-06, "loss": 1.164, "step": 16828 }, { "epoch": 0.51, "learning_rate": 2.564997368189689e-06, "loss": 1.2064, "step": 16829 }, { "epoch": 0.51, "learning_rate": 2.5647535302846782e-06, "loss": 1.2422, "step": 16830 }, { "epoch": 0.51, "learning_rate": 2.5645096917632456e-06, "loss": 1.1141, "step": 16831 }, { "epoch": 0.51, "learning_rate": 2.564265852627711e-06, "loss": 1.1448, "step": 16832 }, { "epoch": 0.51, "learning_rate": 2.5640220128803965e-06, "loss": 1.0131, "step": 16833 }, { "epoch": 0.51, "learning_rate": 2.563778172523624e-06, "loss": 1.0567, "step": 16834 }, { "epoch": 0.51, "learning_rate": 2.5635343315597133e-06, "loss": 1.1666, "step": 16835 }, { "epoch": 0.51, "learning_rate": 2.5632904899909864e-06, "loss": 1.1031, "step": 16836 }, { "epoch": 0.51, "learning_rate": 2.5630466478197646e-06, "loss": 1.0439, "step": 16837 }, { "epoch": 0.51, "learning_rate": 2.5628028050483696e-06, "loss": 1.0814, "step": 16838 }, { "epoch": 0.51, "learning_rate": 2.5625589616791213e-06, "loss": 1.0477, "step": 16839 }, { "epoch": 0.51, "learning_rate": 2.5623151177143424e-06, "loss": 1.1525, "step": 16840 }, { "epoch": 0.51, "learning_rate": 2.5620712731563537e-06, "loss": 1.163, "step": 16841 }, { "epoch": 0.51, "learning_rate": 2.5618274280074756e-06, "loss": 1.1508, "step": 16842 }, { "epoch": 0.51, "learning_rate": 2.5615835822700304e-06, "loss": 1.08, "step": 16843 }, { "epoch": 0.51, "learning_rate": 2.5613397359463393e-06, "loss": 1.1271, "step": 16844 }, { "epoch": 0.51, "learning_rate": 2.561095889038724e-06, "loss": 1.0839, "step": 16845 }, { "epoch": 0.51, "learning_rate": 2.560852041549505e-06, "loss": 1.2415, "step": 16846 }, { "epoch": 0.51, "learning_rate": 2.5606081934810034e-06, "loss": 1.1419, "step": 16847 }, { "epoch": 0.51, "learning_rate": 2.5603643448355416e-06, "loss": 1.009, "step": 16848 }, { "epoch": 0.51, "learning_rate": 2.5601204956154395e-06, "loss": 1.1767, "step": 16849 }, { "epoch": 0.51, "learning_rate": 2.5598766458230197e-06, "loss": 1.2078, "step": 16850 }, { "epoch": 0.51, "learning_rate": 2.559632795460603e-06, "loss": 1.1092, "step": 16851 }, { "epoch": 0.51, "learning_rate": 2.559388944530511e-06, "loss": 1.0172, "step": 16852 }, { "epoch": 0.51, "learning_rate": 2.559145093035065e-06, "loss": 1.0823, "step": 16853 }, { "epoch": 0.51, "learning_rate": 2.558901240976586e-06, "loss": 1.177, "step": 16854 }, { "epoch": 0.51, "learning_rate": 2.5586573883573956e-06, "loss": 1.1772, "step": 16855 }, { "epoch": 0.51, "learning_rate": 2.5584135351798145e-06, "loss": 1.1646, "step": 16856 }, { "epoch": 0.51, "learning_rate": 2.5581696814461652e-06, "loss": 1.1398, "step": 16857 }, { "epoch": 0.51, "learning_rate": 2.557925827158768e-06, "loss": 1.106, "step": 16858 }, { "epoch": 0.51, "learning_rate": 2.557681972319946e-06, "loss": 1.0331, "step": 16859 }, { "epoch": 0.51, "learning_rate": 2.5574381169320184e-06, "loss": 1.1465, "step": 16860 }, { "epoch": 0.51, "learning_rate": 2.5571942609973082e-06, "loss": 1.1821, "step": 16861 }, { "epoch": 0.51, "learning_rate": 2.556950404518136e-06, "loss": 1.1644, "step": 16862 }, { "epoch": 0.51, "learning_rate": 2.5567065474968227e-06, "loss": 1.2087, "step": 16863 }, { "epoch": 0.51, "learning_rate": 2.5564626899356915e-06, "loss": 1.1661, "step": 16864 }, { "epoch": 0.51, "learning_rate": 2.5562188318370617e-06, "loss": 1.1578, "step": 16865 }, { "epoch": 0.51, "learning_rate": 2.555974973203257e-06, "loss": 1.1328, "step": 16866 }, { "epoch": 0.51, "learning_rate": 2.5557311140365964e-06, "loss": 1.1846, "step": 16867 }, { "epoch": 0.51, "learning_rate": 2.5554872543394028e-06, "loss": 1.1182, "step": 16868 }, { "epoch": 0.51, "learning_rate": 2.555243394113997e-06, "loss": 1.2904, "step": 16869 }, { "epoch": 0.51, "learning_rate": 2.5549995333627008e-06, "loss": 1.0657, "step": 16870 }, { "epoch": 0.51, "learning_rate": 2.5547556720878354e-06, "loss": 1.105, "step": 16871 }, { "epoch": 0.51, "learning_rate": 2.5545118102917225e-06, "loss": 1.106, "step": 16872 }, { "epoch": 0.51, "learning_rate": 2.5542679479766833e-06, "loss": 1.1221, "step": 16873 }, { "epoch": 0.51, "learning_rate": 2.5540240851450405e-06, "loss": 1.0092, "step": 16874 }, { "epoch": 0.51, "learning_rate": 2.553780221799113e-06, "loss": 1.2045, "step": 16875 }, { "epoch": 0.51, "learning_rate": 2.553536357941224e-06, "loss": 1.1362, "step": 16876 }, { "epoch": 0.51, "learning_rate": 2.5532924935736954e-06, "loss": 1.17, "step": 16877 }, { "epoch": 0.51, "learning_rate": 2.5530486286988472e-06, "loss": 1.094, "step": 16878 }, { "epoch": 0.51, "learning_rate": 2.552804763319002e-06, "loss": 1.1139, "step": 16879 }, { "epoch": 0.51, "learning_rate": 2.55256089743648e-06, "loss": 1.0737, "step": 16880 }, { "epoch": 0.51, "learning_rate": 2.552317031053605e-06, "loss": 1.0607, "step": 16881 }, { "epoch": 0.51, "learning_rate": 2.5520731641726958e-06, "loss": 1.0477, "step": 16882 }, { "epoch": 0.51, "learning_rate": 2.5518292967960757e-06, "loss": 1.1622, "step": 16883 }, { "epoch": 0.51, "learning_rate": 2.551585428926065e-06, "loss": 1.0882, "step": 16884 }, { "epoch": 0.51, "learning_rate": 2.551341560564987e-06, "loss": 1.1725, "step": 16885 }, { "epoch": 0.51, "learning_rate": 2.5510976917151616e-06, "loss": 1.2616, "step": 16886 }, { "epoch": 0.51, "learning_rate": 2.550853822378911e-06, "loss": 1.0623, "step": 16887 }, { "epoch": 0.51, "learning_rate": 2.550609952558556e-06, "loss": 1.2084, "step": 16888 }, { "epoch": 0.51, "learning_rate": 2.550366082256419e-06, "loss": 1.2184, "step": 16889 }, { "epoch": 0.51, "learning_rate": 2.550122211474821e-06, "loss": 1.0699, "step": 16890 }, { "epoch": 0.51, "learning_rate": 2.5498783402160833e-06, "loss": 1.0677, "step": 16891 }, { "epoch": 0.51, "learning_rate": 2.5496344684825286e-06, "loss": 1.2279, "step": 16892 }, { "epoch": 0.51, "learning_rate": 2.549390596276477e-06, "loss": 1.2598, "step": 16893 }, { "epoch": 0.51, "learning_rate": 2.549146723600251e-06, "loss": 1.1896, "step": 16894 }, { "epoch": 0.51, "learning_rate": 2.548902850456172e-06, "loss": 1.1022, "step": 16895 }, { "epoch": 0.51, "learning_rate": 2.5486589768465613e-06, "loss": 1.0935, "step": 16896 }, { "epoch": 0.51, "learning_rate": 2.5484151027737404e-06, "loss": 1.1633, "step": 16897 }, { "epoch": 0.51, "learning_rate": 2.548171228240031e-06, "loss": 1.1556, "step": 16898 }, { "epoch": 0.51, "learning_rate": 2.5479273532477544e-06, "loss": 1.1531, "step": 16899 }, { "epoch": 0.51, "learning_rate": 2.547683477799234e-06, "loss": 1.1022, "step": 16900 }, { "epoch": 0.51, "learning_rate": 2.5474396018967884e-06, "loss": 1.0534, "step": 16901 }, { "epoch": 0.51, "learning_rate": 2.547195725542741e-06, "loss": 1.2067, "step": 16902 }, { "epoch": 0.51, "learning_rate": 2.546951848739413e-06, "loss": 1.1054, "step": 16903 }, { "epoch": 0.51, "learning_rate": 2.546707971489126e-06, "loss": 1.0269, "step": 16904 }, { "epoch": 0.51, "learning_rate": 2.546464093794202e-06, "loss": 1.3103, "step": 16905 }, { "epoch": 0.51, "learning_rate": 2.5462202156569613e-06, "loss": 1.2315, "step": 16906 }, { "epoch": 0.51, "learning_rate": 2.5459763370797273e-06, "loss": 0.9824, "step": 16907 }, { "epoch": 0.51, "learning_rate": 2.5457324580648207e-06, "loss": 1.0886, "step": 16908 }, { "epoch": 0.51, "learning_rate": 2.545488578614563e-06, "loss": 1.0801, "step": 16909 }, { "epoch": 0.51, "learning_rate": 2.5452446987312757e-06, "loss": 0.9553, "step": 16910 }, { "epoch": 0.51, "learning_rate": 2.54500081841728e-06, "loss": 1.1548, "step": 16911 }, { "epoch": 0.51, "learning_rate": 2.5447569376748995e-06, "loss": 1.1169, "step": 16912 }, { "epoch": 0.51, "learning_rate": 2.544513056506454e-06, "loss": 1.1281, "step": 16913 }, { "epoch": 0.51, "learning_rate": 2.544269174914265e-06, "loss": 1.1248, "step": 16914 }, { "epoch": 0.51, "learning_rate": 2.544025292900656e-06, "loss": 1.1214, "step": 16915 }, { "epoch": 0.51, "learning_rate": 2.5437814104679465e-06, "loss": 1.0798, "step": 16916 }, { "epoch": 0.51, "learning_rate": 2.543537527618459e-06, "loss": 1.1374, "step": 16917 }, { "epoch": 0.51, "learning_rate": 2.543293644354516e-06, "loss": 1.1172, "step": 16918 }, { "epoch": 0.51, "learning_rate": 2.5430497606784375e-06, "loss": 1.1245, "step": 16919 }, { "epoch": 0.51, "learning_rate": 2.5428058765925467e-06, "loss": 1.1091, "step": 16920 }, { "epoch": 0.51, "learning_rate": 2.5425619920991645e-06, "loss": 1.1342, "step": 16921 }, { "epoch": 0.51, "learning_rate": 2.5423181072006125e-06, "loss": 1.1647, "step": 16922 }, { "epoch": 0.51, "learning_rate": 2.5420742218992125e-06, "loss": 1.2114, "step": 16923 }, { "epoch": 0.51, "learning_rate": 2.5418303361972857e-06, "loss": 1.1112, "step": 16924 }, { "epoch": 0.51, "learning_rate": 2.5415864500971544e-06, "loss": 1.1374, "step": 16925 }, { "epoch": 0.51, "learning_rate": 2.5413425636011406e-06, "loss": 1.1655, "step": 16926 }, { "epoch": 0.51, "learning_rate": 2.541098676711565e-06, "loss": 1.1411, "step": 16927 }, { "epoch": 0.51, "learning_rate": 2.5408547894307505e-06, "loss": 1.1069, "step": 16928 }, { "epoch": 0.51, "learning_rate": 2.5406109017610175e-06, "loss": 1.1164, "step": 16929 }, { "epoch": 0.51, "learning_rate": 2.540367013704688e-06, "loss": 1.1074, "step": 16930 }, { "epoch": 0.51, "learning_rate": 2.5401231252640845e-06, "loss": 1.0663, "step": 16931 }, { "epoch": 0.51, "learning_rate": 2.5398792364415283e-06, "loss": 1.1138, "step": 16932 }, { "epoch": 0.51, "learning_rate": 2.539635347239341e-06, "loss": 1.1048, "step": 16933 }, { "epoch": 0.51, "learning_rate": 2.5393914576598433e-06, "loss": 1.0787, "step": 16934 }, { "epoch": 0.51, "learning_rate": 2.539147567705359e-06, "loss": 1.1334, "step": 16935 }, { "epoch": 0.51, "learning_rate": 2.5389036773782083e-06, "loss": 1.046, "step": 16936 }, { "epoch": 0.51, "learning_rate": 2.5386597866807138e-06, "loss": 1.1266, "step": 16937 }, { "epoch": 0.51, "learning_rate": 2.538415895615196e-06, "loss": 1.1152, "step": 16938 }, { "epoch": 0.51, "learning_rate": 2.5381720041839774e-06, "loss": 1.1248, "step": 16939 }, { "epoch": 0.51, "learning_rate": 2.5379281123893796e-06, "loss": 1.1107, "step": 16940 }, { "epoch": 0.51, "learning_rate": 2.5376842202337254e-06, "loss": 1.1199, "step": 16941 }, { "epoch": 0.51, "learning_rate": 2.537440327719334e-06, "loss": 1.1827, "step": 16942 }, { "epoch": 0.51, "learning_rate": 2.53719643484853e-06, "loss": 1.1319, "step": 16943 }, { "epoch": 0.51, "learning_rate": 2.536952541623634e-06, "loss": 1.0375, "step": 16944 }, { "epoch": 0.51, "learning_rate": 2.5367086480469665e-06, "loss": 1.1227, "step": 16945 }, { "epoch": 0.51, "learning_rate": 2.5364647541208513e-06, "loss": 1.0445, "step": 16946 }, { "epoch": 0.51, "learning_rate": 2.536220859847609e-06, "loss": 1.1775, "step": 16947 }, { "epoch": 0.51, "learning_rate": 2.5359769652295617e-06, "loss": 1.2191, "step": 16948 }, { "epoch": 0.51, "learning_rate": 2.535733070269031e-06, "loss": 1.0822, "step": 16949 }, { "epoch": 0.51, "learning_rate": 2.5354891749683387e-06, "loss": 1.0261, "step": 16950 }, { "epoch": 0.51, "learning_rate": 2.535245279329806e-06, "loss": 1.0534, "step": 16951 }, { "epoch": 0.51, "learning_rate": 2.535001383355755e-06, "loss": 1.1407, "step": 16952 }, { "epoch": 0.51, "learning_rate": 2.534757487048508e-06, "loss": 1.0877, "step": 16953 }, { "epoch": 0.51, "learning_rate": 2.5345135904103875e-06, "loss": 1.1016, "step": 16954 }, { "epoch": 0.51, "learning_rate": 2.534269693443713e-06, "loss": 1.1824, "step": 16955 }, { "epoch": 0.51, "learning_rate": 2.5340257961508076e-06, "loss": 1.1486, "step": 16956 }, { "epoch": 0.51, "learning_rate": 2.5337818985339937e-06, "loss": 1.1141, "step": 16957 }, { "epoch": 0.51, "learning_rate": 2.533538000595592e-06, "loss": 1.1543, "step": 16958 }, { "epoch": 0.51, "learning_rate": 2.533294102337925e-06, "loss": 1.1589, "step": 16959 }, { "epoch": 0.51, "learning_rate": 2.5330502037633137e-06, "loss": 1.2712, "step": 16960 }, { "epoch": 0.51, "learning_rate": 2.532806304874081e-06, "loss": 1.1044, "step": 16961 }, { "epoch": 0.51, "learning_rate": 2.532562405672547e-06, "loss": 1.2213, "step": 16962 }, { "epoch": 0.51, "learning_rate": 2.5323185061610357e-06, "loss": 1.1157, "step": 16963 }, { "epoch": 0.51, "learning_rate": 2.532074606341867e-06, "loss": 1.1951, "step": 16964 }, { "epoch": 0.51, "learning_rate": 2.5318307062173637e-06, "loss": 1.0406, "step": 16965 }, { "epoch": 0.51, "learning_rate": 2.5315868057898476e-06, "loss": 1.1169, "step": 16966 }, { "epoch": 0.51, "learning_rate": 2.53134290506164e-06, "loss": 1.114, "step": 16967 }, { "epoch": 0.51, "learning_rate": 2.5310990040350638e-06, "loss": 1.171, "step": 16968 }, { "epoch": 0.51, "learning_rate": 2.5308551027124396e-06, "loss": 1.025, "step": 16969 }, { "epoch": 0.51, "learning_rate": 2.5306112010960894e-06, "loss": 1.168, "step": 16970 }, { "epoch": 0.51, "learning_rate": 2.5303672991883352e-06, "loss": 1.162, "step": 16971 }, { "epoch": 0.51, "learning_rate": 2.5301233969914994e-06, "loss": 1.1099, "step": 16972 }, { "epoch": 0.51, "learning_rate": 2.529879494507903e-06, "loss": 1.1783, "step": 16973 }, { "epoch": 0.51, "learning_rate": 2.5296355917398692e-06, "loss": 1.1968, "step": 16974 }, { "epoch": 0.51, "learning_rate": 2.5293916886897175e-06, "loss": 1.0269, "step": 16975 }, { "epoch": 0.51, "learning_rate": 2.5291477853597722e-06, "loss": 1.1843, "step": 16976 }, { "epoch": 0.51, "learning_rate": 2.528903881752353e-06, "loss": 1.1017, "step": 16977 }, { "epoch": 0.51, "learning_rate": 2.528659977869784e-06, "loss": 1.1778, "step": 16978 }, { "epoch": 0.51, "learning_rate": 2.5284160737143846e-06, "loss": 1.0893, "step": 16979 }, { "epoch": 0.51, "learning_rate": 2.528172169288478e-06, "loss": 1.0547, "step": 16980 }, { "epoch": 0.51, "learning_rate": 2.5279282645943863e-06, "loss": 1.1668, "step": 16981 }, { "epoch": 0.51, "learning_rate": 2.5276843596344316e-06, "loss": 1.0675, "step": 16982 }, { "epoch": 0.51, "learning_rate": 2.527440454410934e-06, "loss": 1.0985, "step": 16983 }, { "epoch": 0.51, "learning_rate": 2.5271965489262164e-06, "loss": 1.1042, "step": 16984 }, { "epoch": 0.51, "learning_rate": 2.526952643182602e-06, "loss": 1.0486, "step": 16985 }, { "epoch": 0.51, "learning_rate": 2.52670873718241e-06, "loss": 1.1743, "step": 16986 }, { "epoch": 0.51, "learning_rate": 2.526464830927965e-06, "loss": 1.2026, "step": 16987 }, { "epoch": 0.51, "learning_rate": 2.5262209244215867e-06, "loss": 1.1415, "step": 16988 }, { "epoch": 0.51, "learning_rate": 2.5259770176655985e-06, "loss": 1.0746, "step": 16989 }, { "epoch": 0.51, "learning_rate": 2.5257331106623207e-06, "loss": 1.0357, "step": 16990 }, { "epoch": 0.51, "learning_rate": 2.5254892034140773e-06, "loss": 1.2034, "step": 16991 }, { "epoch": 0.51, "learning_rate": 2.5252452959231876e-06, "loss": 1.1888, "step": 16992 }, { "epoch": 0.51, "learning_rate": 2.5250013881919757e-06, "loss": 1.153, "step": 16993 }, { "epoch": 0.51, "learning_rate": 2.524757480222762e-06, "loss": 1.1208, "step": 16994 }, { "epoch": 0.51, "learning_rate": 2.5245135720178697e-06, "loss": 1.0938, "step": 16995 }, { "epoch": 0.51, "learning_rate": 2.5242696635796194e-06, "loss": 1.0666, "step": 16996 }, { "epoch": 0.51, "learning_rate": 2.5240257549103338e-06, "loss": 1.082, "step": 16997 }, { "epoch": 0.51, "learning_rate": 2.523781846012335e-06, "loss": 1.1357, "step": 16998 }, { "epoch": 0.51, "learning_rate": 2.523537936887944e-06, "loss": 1.0784, "step": 16999 }, { "epoch": 0.51, "learning_rate": 2.5232940275394834e-06, "loss": 1.2315, "step": 17000 }, { "epoch": 0.51, "learning_rate": 2.5230501179692744e-06, "loss": 1.1, "step": 17001 }, { "epoch": 0.51, "learning_rate": 2.5228062081796407e-06, "loss": 1.0867, "step": 17002 }, { "epoch": 0.51, "learning_rate": 2.5225622981729015e-06, "loss": 1.1824, "step": 17003 }, { "epoch": 0.51, "learning_rate": 2.522318387951381e-06, "loss": 1.1926, "step": 17004 }, { "epoch": 0.51, "learning_rate": 2.5220744775173995e-06, "loss": 1.2289, "step": 17005 }, { "epoch": 0.51, "learning_rate": 2.5218305668732794e-06, "loss": 1.2656, "step": 17006 }, { "epoch": 0.51, "learning_rate": 2.521586656021343e-06, "loss": 1.0867, "step": 17007 }, { "epoch": 0.51, "learning_rate": 2.521342744963913e-06, "loss": 1.1058, "step": 17008 }, { "epoch": 0.51, "learning_rate": 2.5210988337033094e-06, "loss": 1.0232, "step": 17009 }, { "epoch": 0.51, "learning_rate": 2.520854922241855e-06, "loss": 1.1808, "step": 17010 }, { "epoch": 0.51, "learning_rate": 2.5206110105818722e-06, "loss": 1.1791, "step": 17011 }, { "epoch": 0.51, "learning_rate": 2.5203670987256823e-06, "loss": 1.213, "step": 17012 }, { "epoch": 0.51, "learning_rate": 2.520123186675608e-06, "loss": 1.1181, "step": 17013 }, { "epoch": 0.51, "learning_rate": 2.51987927443397e-06, "loss": 0.9908, "step": 17014 }, { "epoch": 0.51, "learning_rate": 2.519635362003091e-06, "loss": 1.1505, "step": 17015 }, { "epoch": 0.51, "learning_rate": 2.5193914493852926e-06, "loss": 0.979, "step": 17016 }, { "epoch": 0.51, "learning_rate": 2.519147536582898e-06, "loss": 1.1735, "step": 17017 }, { "epoch": 0.51, "learning_rate": 2.5189036235982266e-06, "loss": 1.1096, "step": 17018 }, { "epoch": 0.51, "learning_rate": 2.518659710433603e-06, "loss": 1.0631, "step": 17019 }, { "epoch": 0.51, "learning_rate": 2.5184157970913473e-06, "loss": 1.1489, "step": 17020 }, { "epoch": 0.51, "learning_rate": 2.5181718835737823e-06, "loss": 1.1761, "step": 17021 }, { "epoch": 0.51, "learning_rate": 2.5179279698832294e-06, "loss": 1.1949, "step": 17022 }, { "epoch": 0.51, "learning_rate": 2.517684056022011e-06, "loss": 1.094, "step": 17023 }, { "epoch": 0.51, "learning_rate": 2.5174401419924495e-06, "loss": 1.1719, "step": 17024 }, { "epoch": 0.51, "learning_rate": 2.5171962277968655e-06, "loss": 1.1203, "step": 17025 }, { "epoch": 0.51, "learning_rate": 2.516952313437582e-06, "loss": 1.1163, "step": 17026 }, { "epoch": 0.51, "learning_rate": 2.5167083989169205e-06, "loss": 1.1281, "step": 17027 }, { "epoch": 0.51, "learning_rate": 2.5164644842372034e-06, "loss": 0.9786, "step": 17028 }, { "epoch": 0.51, "learning_rate": 2.5162205694007517e-06, "loss": 1.0874, "step": 17029 }, { "epoch": 0.51, "learning_rate": 2.515976654409889e-06, "loss": 1.1829, "step": 17030 }, { "epoch": 0.51, "learning_rate": 2.5157327392669354e-06, "loss": 1.2039, "step": 17031 }, { "epoch": 0.51, "learning_rate": 2.515488823974214e-06, "loss": 1.1813, "step": 17032 }, { "epoch": 0.51, "learning_rate": 2.515244908534046e-06, "loss": 1.0935, "step": 17033 }, { "epoch": 0.51, "learning_rate": 2.5150009929487547e-06, "loss": 1.017, "step": 17034 }, { "epoch": 0.51, "learning_rate": 2.5147570772206602e-06, "loss": 1.1797, "step": 17035 }, { "epoch": 0.51, "learning_rate": 2.5145131613520858e-06, "loss": 1.1468, "step": 17036 }, { "epoch": 0.51, "learning_rate": 2.514269245345354e-06, "loss": 1.0556, "step": 17037 }, { "epoch": 0.51, "learning_rate": 2.514025329202784e-06, "loss": 1.2632, "step": 17038 }, { "epoch": 0.51, "learning_rate": 2.5137814129267014e-06, "loss": 1.1869, "step": 17039 }, { "epoch": 0.51, "learning_rate": 2.5135374965194254e-06, "loss": 1.1, "step": 17040 }, { "epoch": 0.51, "learning_rate": 2.5132935799832797e-06, "loss": 1.1628, "step": 17041 }, { "epoch": 0.51, "learning_rate": 2.5130496633205848e-06, "loss": 1.1387, "step": 17042 }, { "epoch": 0.51, "learning_rate": 2.512805746533664e-06, "loss": 1.0894, "step": 17043 }, { "epoch": 0.51, "learning_rate": 2.5125618296248382e-06, "loss": 1.1796, "step": 17044 }, { "epoch": 0.51, "learning_rate": 2.5123179125964305e-06, "loss": 1.0958, "step": 17045 }, { "epoch": 0.51, "learning_rate": 2.512073995450761e-06, "loss": 1.124, "step": 17046 }, { "epoch": 0.51, "learning_rate": 2.5118300781901533e-06, "loss": 1.1486, "step": 17047 }, { "epoch": 0.51, "learning_rate": 2.511586160816929e-06, "loss": 1.173, "step": 17048 }, { "epoch": 0.51, "learning_rate": 2.5113422433334104e-06, "loss": 1.1555, "step": 17049 }, { "epoch": 0.51, "learning_rate": 2.5110983257419193e-06, "loss": 1.081, "step": 17050 }, { "epoch": 0.51, "learning_rate": 2.5108544080447765e-06, "loss": 1.0911, "step": 17051 }, { "epoch": 0.51, "learning_rate": 2.5106104902443058e-06, "loss": 1.1516, "step": 17052 }, { "epoch": 0.51, "learning_rate": 2.5103665723428277e-06, "loss": 1.0676, "step": 17053 }, { "epoch": 0.51, "learning_rate": 2.510122654342666e-06, "loss": 1.1047, "step": 17054 }, { "epoch": 0.51, "learning_rate": 2.5098787362461404e-06, "loss": 1.2327, "step": 17055 }, { "epoch": 0.51, "learning_rate": 2.5096348180555746e-06, "loss": 1.0649, "step": 17056 }, { "epoch": 0.51, "learning_rate": 2.5093908997732896e-06, "loss": 1.1119, "step": 17057 }, { "epoch": 0.51, "learning_rate": 2.5091469814016083e-06, "loss": 1.207, "step": 17058 }, { "epoch": 0.51, "learning_rate": 2.508903062942851e-06, "loss": 1.1956, "step": 17059 }, { "epoch": 0.51, "learning_rate": 2.5086591443993424e-06, "loss": 1.1059, "step": 17060 }, { "epoch": 0.51, "learning_rate": 2.5084152257734017e-06, "loss": 1.1335, "step": 17061 }, { "epoch": 0.51, "learning_rate": 2.508171307067352e-06, "loss": 1.1281, "step": 17062 }, { "epoch": 0.51, "learning_rate": 2.507927388283516e-06, "loss": 1.1174, "step": 17063 }, { "epoch": 0.51, "learning_rate": 2.5076834694242146e-06, "loss": 1.1299, "step": 17064 }, { "epoch": 0.51, "learning_rate": 2.507439550491771e-06, "loss": 1.1873, "step": 17065 }, { "epoch": 0.51, "learning_rate": 2.5071956314885053e-06, "loss": 1.2175, "step": 17066 }, { "epoch": 0.51, "learning_rate": 2.506951712416742e-06, "loss": 1.1121, "step": 17067 }, { "epoch": 0.51, "learning_rate": 2.5067077932788008e-06, "loss": 1.1132, "step": 17068 }, { "epoch": 0.51, "learning_rate": 2.506463874077005e-06, "loss": 1.1852, "step": 17069 }, { "epoch": 0.51, "learning_rate": 2.5062199548136768e-06, "loss": 1.0906, "step": 17070 }, { "epoch": 0.51, "learning_rate": 2.505976035491137e-06, "loss": 1.0402, "step": 17071 }, { "epoch": 0.51, "learning_rate": 2.505732116111708e-06, "loss": 0.9911, "step": 17072 }, { "epoch": 0.51, "learning_rate": 2.5054881966777127e-06, "loss": 1.0978, "step": 17073 }, { "epoch": 0.51, "learning_rate": 2.505244277191472e-06, "loss": 1.3107, "step": 17074 }, { "epoch": 0.51, "learning_rate": 2.505000357655308e-06, "loss": 1.1939, "step": 17075 }, { "epoch": 0.51, "learning_rate": 2.504756438071543e-06, "loss": 1.1889, "step": 17076 }, { "epoch": 0.51, "learning_rate": 2.504512518442499e-06, "loss": 1.1443, "step": 17077 }, { "epoch": 0.51, "learning_rate": 2.504268598770499e-06, "loss": 1.0928, "step": 17078 }, { "epoch": 0.51, "learning_rate": 2.5040246790578624e-06, "loss": 1.1179, "step": 17079 }, { "epoch": 0.51, "learning_rate": 2.5037807593069146e-06, "loss": 1.1792, "step": 17080 }, { "epoch": 0.51, "learning_rate": 2.503536839519974e-06, "loss": 1.1233, "step": 17081 }, { "epoch": 0.51, "learning_rate": 2.503292919699366e-06, "loss": 1.166, "step": 17082 }, { "epoch": 0.51, "learning_rate": 2.50304899984741e-06, "loss": 1.1432, "step": 17083 }, { "epoch": 0.51, "learning_rate": 2.5028050799664298e-06, "loss": 1.1161, "step": 17084 }, { "epoch": 0.51, "learning_rate": 2.5025611600587457e-06, "loss": 1.0863, "step": 17085 }, { "epoch": 0.51, "learning_rate": 2.5023172401266814e-06, "loss": 1.1523, "step": 17086 }, { "epoch": 0.51, "learning_rate": 2.502073320172557e-06, "loss": 1.1868, "step": 17087 }, { "epoch": 0.51, "learning_rate": 2.5018294001986964e-06, "loss": 1.1208, "step": 17088 }, { "epoch": 0.51, "learning_rate": 2.5015854802074203e-06, "loss": 1.2918, "step": 17089 }, { "epoch": 0.51, "learning_rate": 2.5013415602010514e-06, "loss": 1.0529, "step": 17090 }, { "epoch": 0.51, "learning_rate": 2.501097640181912e-06, "loss": 1.0916, "step": 17091 }, { "epoch": 0.51, "learning_rate": 2.500853720152323e-06, "loss": 1.2014, "step": 17092 }, { "epoch": 0.51, "learning_rate": 2.500609800114607e-06, "loss": 1.1454, "step": 17093 }, { "epoch": 0.51, "learning_rate": 2.500365880071086e-06, "loss": 1.1411, "step": 17094 }, { "epoch": 0.51, "learning_rate": 2.500121960024083e-06, "loss": 1.1296, "step": 17095 }, { "epoch": 0.52, "learning_rate": 2.499878039975918e-06, "loss": 1.067, "step": 17096 }, { "epoch": 0.52, "learning_rate": 2.499634119928914e-06, "loss": 1.023, "step": 17097 }, { "epoch": 0.52, "learning_rate": 2.499390199885394e-06, "loss": 1.1268, "step": 17098 }, { "epoch": 0.52, "learning_rate": 2.4991462798476777e-06, "loss": 1.1094, "step": 17099 }, { "epoch": 0.52, "learning_rate": 2.498902359818089e-06, "loss": 1.1359, "step": 17100 }, { "epoch": 0.52, "learning_rate": 2.498658439798949e-06, "loss": 1.1796, "step": 17101 }, { "epoch": 0.52, "learning_rate": 2.49841451979258e-06, "loss": 1.1571, "step": 17102 }, { "epoch": 0.52, "learning_rate": 2.4981705998013044e-06, "loss": 1.185, "step": 17103 }, { "epoch": 0.52, "learning_rate": 2.4979266798274433e-06, "loss": 1.097, "step": 17104 }, { "epoch": 0.52, "learning_rate": 2.4976827598733194e-06, "loss": 1.243, "step": 17105 }, { "epoch": 0.52, "learning_rate": 2.4974388399412543e-06, "loss": 1.0846, "step": 17106 }, { "epoch": 0.52, "learning_rate": 2.4971949200335715e-06, "loss": 1.0538, "step": 17107 }, { "epoch": 0.52, "learning_rate": 2.4969510001525906e-06, "loss": 1.1873, "step": 17108 }, { "epoch": 0.52, "learning_rate": 2.4967070803006345e-06, "loss": 1.1156, "step": 17109 }, { "epoch": 0.52, "learning_rate": 2.4964631604800258e-06, "loss": 1.1785, "step": 17110 }, { "epoch": 0.52, "learning_rate": 2.4962192406930867e-06, "loss": 1.1476, "step": 17111 }, { "epoch": 0.52, "learning_rate": 2.495975320942138e-06, "loss": 1.2319, "step": 17112 }, { "epoch": 0.52, "learning_rate": 2.495731401229502e-06, "loss": 1.2013, "step": 17113 }, { "epoch": 0.52, "learning_rate": 2.4954874815575013e-06, "loss": 1.1197, "step": 17114 }, { "epoch": 0.52, "learning_rate": 2.4952435619284576e-06, "loss": 1.1794, "step": 17115 }, { "epoch": 0.52, "learning_rate": 2.494999642344693e-06, "loss": 1.0235, "step": 17116 }, { "epoch": 0.52, "learning_rate": 2.494755722808529e-06, "loss": 1.1246, "step": 17117 }, { "epoch": 0.52, "learning_rate": 2.4945118033222877e-06, "loss": 1.06, "step": 17118 }, { "epoch": 0.52, "learning_rate": 2.494267883888292e-06, "loss": 1.1363, "step": 17119 }, { "epoch": 0.52, "learning_rate": 2.4940239645088642e-06, "loss": 1.1454, "step": 17120 }, { "epoch": 0.52, "learning_rate": 2.493780045186324e-06, "loss": 1.1636, "step": 17121 }, { "epoch": 0.52, "learning_rate": 2.4935361259229953e-06, "loss": 1.0588, "step": 17122 }, { "epoch": 0.52, "learning_rate": 2.4932922067211992e-06, "loss": 1.2533, "step": 17123 }, { "epoch": 0.52, "learning_rate": 2.4930482875832593e-06, "loss": 1.285, "step": 17124 }, { "epoch": 0.52, "learning_rate": 2.492804368511495e-06, "loss": 1.1109, "step": 17125 }, { "epoch": 0.52, "learning_rate": 2.49256044950823e-06, "loss": 1.0671, "step": 17126 }, { "epoch": 0.52, "learning_rate": 2.4923165305757858e-06, "loss": 1.1245, "step": 17127 }, { "epoch": 0.52, "learning_rate": 2.492072611716485e-06, "loss": 1.1021, "step": 17128 }, { "epoch": 0.52, "learning_rate": 2.4918286929326484e-06, "loss": 1.0483, "step": 17129 }, { "epoch": 0.52, "learning_rate": 2.491584774226599e-06, "loss": 1.2739, "step": 17130 }, { "epoch": 0.52, "learning_rate": 2.4913408556006584e-06, "loss": 1.095, "step": 17131 }, { "epoch": 0.52, "learning_rate": 2.4910969370571493e-06, "loss": 1.093, "step": 17132 }, { "epoch": 0.52, "learning_rate": 2.490853018598393e-06, "loss": 1.0969, "step": 17133 }, { "epoch": 0.52, "learning_rate": 2.4906091002267112e-06, "loss": 1.1328, "step": 17134 }, { "epoch": 0.52, "learning_rate": 2.490365181944426e-06, "loss": 1.0925, "step": 17135 }, { "epoch": 0.52, "learning_rate": 2.4901212637538596e-06, "loss": 1.1551, "step": 17136 }, { "epoch": 0.52, "learning_rate": 2.4898773456573352e-06, "loss": 1.0383, "step": 17137 }, { "epoch": 0.52, "learning_rate": 2.4896334276571727e-06, "loss": 1.1705, "step": 17138 }, { "epoch": 0.52, "learning_rate": 2.4893895097556946e-06, "loss": 1.1861, "step": 17139 }, { "epoch": 0.52, "learning_rate": 2.489145591955224e-06, "loss": 1.0635, "step": 17140 }, { "epoch": 0.52, "learning_rate": 2.488901674258082e-06, "loss": 1.11, "step": 17141 }, { "epoch": 0.52, "learning_rate": 2.48865775666659e-06, "loss": 1.1197, "step": 17142 }, { "epoch": 0.52, "learning_rate": 2.488413839183072e-06, "loss": 1.2203, "step": 17143 }, { "epoch": 0.52, "learning_rate": 2.488169921809847e-06, "loss": 1.0547, "step": 17144 }, { "epoch": 0.52, "learning_rate": 2.4879260045492397e-06, "loss": 1.1157, "step": 17145 }, { "epoch": 0.52, "learning_rate": 2.4876820874035712e-06, "loss": 1.2139, "step": 17146 }, { "epoch": 0.52, "learning_rate": 2.4874381703751626e-06, "loss": 1.1204, "step": 17147 }, { "epoch": 0.52, "learning_rate": 2.487194253466337e-06, "loss": 1.1906, "step": 17148 }, { "epoch": 0.52, "learning_rate": 2.486950336679415e-06, "loss": 1.2451, "step": 17149 }, { "epoch": 0.52, "learning_rate": 2.4867064200167215e-06, "loss": 1.1364, "step": 17150 }, { "epoch": 0.52, "learning_rate": 2.4864625034805754e-06, "loss": 1.2474, "step": 17151 }, { "epoch": 0.52, "learning_rate": 2.4862185870732995e-06, "loss": 1.1098, "step": 17152 }, { "epoch": 0.52, "learning_rate": 2.4859746707972158e-06, "loss": 1.0969, "step": 17153 }, { "epoch": 0.52, "learning_rate": 2.4857307546546478e-06, "loss": 1.1965, "step": 17154 }, { "epoch": 0.52, "learning_rate": 2.485486838647915e-06, "loss": 1.3315, "step": 17155 }, { "epoch": 0.52, "learning_rate": 2.48524292277934e-06, "loss": 1.0782, "step": 17156 }, { "epoch": 0.52, "learning_rate": 2.484999007051246e-06, "loss": 1.1865, "step": 17157 }, { "epoch": 0.52, "learning_rate": 2.4847550914659543e-06, "loss": 1.0425, "step": 17158 }, { "epoch": 0.52, "learning_rate": 2.484511176025787e-06, "loss": 1.1065, "step": 17159 }, { "epoch": 0.52, "learning_rate": 2.4842672607330654e-06, "loss": 1.1662, "step": 17160 }, { "epoch": 0.52, "learning_rate": 2.4840233455901115e-06, "loss": 1.1406, "step": 17161 }, { "epoch": 0.52, "learning_rate": 2.4837794305992482e-06, "loss": 1.2125, "step": 17162 }, { "epoch": 0.52, "learning_rate": 2.483535515762798e-06, "loss": 1.0969, "step": 17163 }, { "epoch": 0.52, "learning_rate": 2.4832916010830803e-06, "loss": 1.1201, "step": 17164 }, { "epoch": 0.52, "learning_rate": 2.4830476865624186e-06, "loss": 1.2188, "step": 17165 }, { "epoch": 0.52, "learning_rate": 2.482803772203135e-06, "loss": 1.1121, "step": 17166 }, { "epoch": 0.52, "learning_rate": 2.482559858007552e-06, "loss": 1.1667, "step": 17167 }, { "epoch": 0.52, "learning_rate": 2.4823159439779896e-06, "loss": 1.039, "step": 17168 }, { "epoch": 0.52, "learning_rate": 2.4820720301167714e-06, "loss": 1.2355, "step": 17169 }, { "epoch": 0.52, "learning_rate": 2.4818281164262185e-06, "loss": 1.1494, "step": 17170 }, { "epoch": 0.52, "learning_rate": 2.481584202908653e-06, "loss": 1.1169, "step": 17171 }, { "epoch": 0.52, "learning_rate": 2.481340289566398e-06, "loss": 1.0823, "step": 17172 }, { "epoch": 0.52, "learning_rate": 2.481096376401774e-06, "loss": 1.1196, "step": 17173 }, { "epoch": 0.52, "learning_rate": 2.4808524634171026e-06, "loss": 1.1756, "step": 17174 }, { "epoch": 0.52, "learning_rate": 2.4806085506147074e-06, "loss": 1.0296, "step": 17175 }, { "epoch": 0.52, "learning_rate": 2.48036463799691e-06, "loss": 0.9722, "step": 17176 }, { "epoch": 0.52, "learning_rate": 2.480120725566031e-06, "loss": 1.2164, "step": 17177 }, { "epoch": 0.52, "learning_rate": 2.4798768133243927e-06, "loss": 1.1415, "step": 17178 }, { "epoch": 0.52, "learning_rate": 2.4796329012743177e-06, "loss": 1.179, "step": 17179 }, { "epoch": 0.52, "learning_rate": 2.479388989418129e-06, "loss": 1.0905, "step": 17180 }, { "epoch": 0.52, "learning_rate": 2.4791450777581458e-06, "loss": 1.0773, "step": 17181 }, { "epoch": 0.52, "learning_rate": 2.478901166296692e-06, "loss": 1.1782, "step": 17182 }, { "epoch": 0.52, "learning_rate": 2.478657255036088e-06, "loss": 1.1432, "step": 17183 }, { "epoch": 0.52, "learning_rate": 2.478413343978657e-06, "loss": 1.0897, "step": 17184 }, { "epoch": 0.52, "learning_rate": 2.478169433126721e-06, "loss": 1.144, "step": 17185 }, { "epoch": 0.52, "learning_rate": 2.4779255224826013e-06, "loss": 1.201, "step": 17186 }, { "epoch": 0.52, "learning_rate": 2.47768161204862e-06, "loss": 1.0972, "step": 17187 }, { "epoch": 0.52, "learning_rate": 2.4774377018270985e-06, "loss": 1.1005, "step": 17188 }, { "epoch": 0.52, "learning_rate": 2.477193791820361e-06, "loss": 1.1873, "step": 17189 }, { "epoch": 0.52, "learning_rate": 2.476949882030726e-06, "loss": 1.0564, "step": 17190 }, { "epoch": 0.52, "learning_rate": 2.476705972460517e-06, "loss": 1.1544, "step": 17191 }, { "epoch": 0.52, "learning_rate": 2.4764620631120566e-06, "loss": 1.1629, "step": 17192 }, { "epoch": 0.52, "learning_rate": 2.4762181539876665e-06, "loss": 1.1143, "step": 17193 }, { "epoch": 0.52, "learning_rate": 2.475974245089667e-06, "loss": 1.2502, "step": 17194 }, { "epoch": 0.52, "learning_rate": 2.4757303364203814e-06, "loss": 1.1193, "step": 17195 }, { "epoch": 0.52, "learning_rate": 2.475486427982131e-06, "loss": 1.1323, "step": 17196 }, { "epoch": 0.52, "learning_rate": 2.4752425197772385e-06, "loss": 1.195, "step": 17197 }, { "epoch": 0.52, "learning_rate": 2.474998611808025e-06, "loss": 1.2512, "step": 17198 }, { "epoch": 0.52, "learning_rate": 2.474754704076813e-06, "loss": 1.1136, "step": 17199 }, { "epoch": 0.52, "learning_rate": 2.4745107965859236e-06, "loss": 1.0002, "step": 17200 }, { "epoch": 0.52, "learning_rate": 2.4742668893376792e-06, "loss": 1.1336, "step": 17201 }, { "epoch": 0.52, "learning_rate": 2.4740229823344028e-06, "loss": 1.1246, "step": 17202 }, { "epoch": 0.52, "learning_rate": 2.473779075578414e-06, "loss": 1.1024, "step": 17203 }, { "epoch": 0.52, "learning_rate": 2.4735351690720356e-06, "loss": 1.0571, "step": 17204 }, { "epoch": 0.52, "learning_rate": 2.4732912628175896e-06, "loss": 0.9731, "step": 17205 }, { "epoch": 0.52, "learning_rate": 2.4730473568173996e-06, "loss": 1.1721, "step": 17206 }, { "epoch": 0.52, "learning_rate": 2.472803451073784e-06, "loss": 1.0867, "step": 17207 }, { "epoch": 0.52, "learning_rate": 2.472559545589067e-06, "loss": 1.1024, "step": 17208 }, { "epoch": 0.52, "learning_rate": 2.4723156403655697e-06, "loss": 1.0591, "step": 17209 }, { "epoch": 0.52, "learning_rate": 2.472071735405614e-06, "loss": 1.0477, "step": 17210 }, { "epoch": 0.52, "learning_rate": 2.4718278307115226e-06, "loss": 1.1089, "step": 17211 }, { "epoch": 0.52, "learning_rate": 2.4715839262856162e-06, "loss": 1.0873, "step": 17212 }, { "epoch": 0.52, "learning_rate": 2.471340022130217e-06, "loss": 1.205, "step": 17213 }, { "epoch": 0.52, "learning_rate": 2.4710961182476475e-06, "loss": 1.1162, "step": 17214 }, { "epoch": 0.52, "learning_rate": 2.470852214640229e-06, "loss": 1.1107, "step": 17215 }, { "epoch": 0.52, "learning_rate": 2.470608311310283e-06, "loss": 1.136, "step": 17216 }, { "epoch": 0.52, "learning_rate": 2.4703644082601316e-06, "loss": 1.1985, "step": 17217 }, { "epoch": 0.52, "learning_rate": 2.470120505492097e-06, "loss": 1.2045, "step": 17218 }, { "epoch": 0.52, "learning_rate": 2.469876603008502e-06, "loss": 1.1392, "step": 17219 }, { "epoch": 0.52, "learning_rate": 2.4696327008116656e-06, "loss": 1.0344, "step": 17220 }, { "epoch": 0.52, "learning_rate": 2.4693887989039115e-06, "loss": 1.1394, "step": 17221 }, { "epoch": 0.52, "learning_rate": 2.4691448972875612e-06, "loss": 1.1363, "step": 17222 }, { "epoch": 0.52, "learning_rate": 2.4689009959649366e-06, "loss": 1.1039, "step": 17223 }, { "epoch": 0.52, "learning_rate": 2.4686570949383602e-06, "loss": 1.186, "step": 17224 }, { "epoch": 0.52, "learning_rate": 2.4684131942101533e-06, "loss": 1.2017, "step": 17225 }, { "epoch": 0.52, "learning_rate": 2.468169293782637e-06, "loss": 1.1057, "step": 17226 }, { "epoch": 0.52, "learning_rate": 2.4679253936581334e-06, "loss": 1.1792, "step": 17227 }, { "epoch": 0.52, "learning_rate": 2.4676814938389656e-06, "loss": 1.0149, "step": 17228 }, { "epoch": 0.52, "learning_rate": 2.4674375943274537e-06, "loss": 1.131, "step": 17229 }, { "epoch": 0.52, "learning_rate": 2.4671936951259203e-06, "loss": 1.1342, "step": 17230 }, { "epoch": 0.52, "learning_rate": 2.4669497962366867e-06, "loss": 1.0499, "step": 17231 }, { "epoch": 0.52, "learning_rate": 2.4667058976620762e-06, "loss": 1.2874, "step": 17232 }, { "epoch": 0.52, "learning_rate": 2.466461999404409e-06, "loss": 1.0408, "step": 17233 }, { "epoch": 0.52, "learning_rate": 2.466218101466007e-06, "loss": 1.0289, "step": 17234 }, { "epoch": 0.52, "learning_rate": 2.4659742038491928e-06, "loss": 1.1442, "step": 17235 }, { "epoch": 0.52, "learning_rate": 2.465730306556287e-06, "loss": 1.2563, "step": 17236 }, { "epoch": 0.52, "learning_rate": 2.4654864095896142e-06, "loss": 1.168, "step": 17237 }, { "epoch": 0.52, "learning_rate": 2.4652425129514926e-06, "loss": 1.0223, "step": 17238 }, { "epoch": 0.52, "learning_rate": 2.4649986166442454e-06, "loss": 1.1225, "step": 17239 }, { "epoch": 0.52, "learning_rate": 2.464754720670195e-06, "loss": 1.1268, "step": 17240 }, { "epoch": 0.52, "learning_rate": 2.4645108250316626e-06, "loss": 1.139, "step": 17241 }, { "epoch": 0.52, "learning_rate": 2.46426692973097e-06, "loss": 1.1687, "step": 17242 }, { "epoch": 0.52, "learning_rate": 2.4640230347704387e-06, "loss": 1.0828, "step": 17243 }, { "epoch": 0.52, "learning_rate": 2.463779140152391e-06, "loss": 1.1186, "step": 17244 }, { "epoch": 0.52, "learning_rate": 2.4635352458791495e-06, "loss": 1.1313, "step": 17245 }, { "epoch": 0.52, "learning_rate": 2.463291351953034e-06, "loss": 1.0878, "step": 17246 }, { "epoch": 0.52, "learning_rate": 2.4630474583763668e-06, "loss": 1.0933, "step": 17247 }, { "epoch": 0.52, "learning_rate": 2.46280356515147e-06, "loss": 1.2039, "step": 17248 }, { "epoch": 0.52, "learning_rate": 2.4625596722806654e-06, "loss": 1.1826, "step": 17249 }, { "epoch": 0.52, "learning_rate": 2.4623157797662763e-06, "loss": 1.1325, "step": 17250 }, { "epoch": 0.52, "learning_rate": 2.462071887610621e-06, "loss": 1.141, "step": 17251 }, { "epoch": 0.52, "learning_rate": 2.4618279958160234e-06, "loss": 1.0182, "step": 17252 }, { "epoch": 0.52, "learning_rate": 2.4615841043848047e-06, "loss": 1.1373, "step": 17253 }, { "epoch": 0.52, "learning_rate": 2.4613402133192875e-06, "loss": 1.1535, "step": 17254 }, { "epoch": 0.52, "learning_rate": 2.4610963226217925e-06, "loss": 1.1138, "step": 17255 }, { "epoch": 0.52, "learning_rate": 2.4608524322946415e-06, "loss": 1.0546, "step": 17256 }, { "epoch": 0.52, "learning_rate": 2.4606085423401566e-06, "loss": 1.1622, "step": 17257 }, { "epoch": 0.52, "learning_rate": 2.4603646527606604e-06, "loss": 1.105, "step": 17258 }, { "epoch": 0.52, "learning_rate": 2.4601207635584725e-06, "loss": 1.0358, "step": 17259 }, { "epoch": 0.52, "learning_rate": 2.4598768747359163e-06, "loss": 1.1511, "step": 17260 }, { "epoch": 0.52, "learning_rate": 2.4596329862953123e-06, "loss": 1.0805, "step": 17261 }, { "epoch": 0.52, "learning_rate": 2.459389098238983e-06, "loss": 1.1448, "step": 17262 }, { "epoch": 0.52, "learning_rate": 2.459145210569251e-06, "loss": 1.0855, "step": 17263 }, { "epoch": 0.52, "learning_rate": 2.4589013232884356e-06, "loss": 1.07, "step": 17264 }, { "epoch": 0.52, "learning_rate": 2.4586574363988602e-06, "loss": 1.1379, "step": 17265 }, { "epoch": 0.52, "learning_rate": 2.4584135499028456e-06, "loss": 1.2043, "step": 17266 }, { "epoch": 0.52, "learning_rate": 2.458169663802715e-06, "loss": 1.129, "step": 17267 }, { "epoch": 0.52, "learning_rate": 2.4579257781007884e-06, "loss": 1.1539, "step": 17268 }, { "epoch": 0.52, "learning_rate": 2.457681892799388e-06, "loss": 1.2358, "step": 17269 }, { "epoch": 0.52, "learning_rate": 2.457438007900836e-06, "loss": 1.1309, "step": 17270 }, { "epoch": 0.52, "learning_rate": 2.457194123407454e-06, "loss": 1.1017, "step": 17271 }, { "epoch": 0.52, "learning_rate": 2.456950239321563e-06, "loss": 1.0195, "step": 17272 }, { "epoch": 0.52, "learning_rate": 2.456706355645485e-06, "loss": 1.0494, "step": 17273 }, { "epoch": 0.52, "learning_rate": 2.4564624723815413e-06, "loss": 1.1647, "step": 17274 }, { "epoch": 0.52, "learning_rate": 2.456218589532054e-06, "loss": 1.0327, "step": 17275 }, { "epoch": 0.52, "learning_rate": 2.4559747070993452e-06, "loss": 1.1293, "step": 17276 }, { "epoch": 0.52, "learning_rate": 2.4557308250857354e-06, "loss": 1.0715, "step": 17277 }, { "epoch": 0.52, "learning_rate": 2.455486943493547e-06, "loss": 1.1666, "step": 17278 }, { "epoch": 0.52, "learning_rate": 2.455243062325101e-06, "loss": 1.2682, "step": 17279 }, { "epoch": 0.52, "learning_rate": 2.4549991815827202e-06, "loss": 0.981, "step": 17280 }, { "epoch": 0.52, "learning_rate": 2.454755301268725e-06, "loss": 1.215, "step": 17281 }, { "epoch": 0.52, "learning_rate": 2.4545114213854375e-06, "loss": 1.1117, "step": 17282 }, { "epoch": 0.52, "learning_rate": 2.4542675419351797e-06, "loss": 1.1492, "step": 17283 }, { "epoch": 0.52, "learning_rate": 2.4540236629202736e-06, "loss": 1.1343, "step": 17284 }, { "epoch": 0.52, "learning_rate": 2.453779784343039e-06, "loss": 1.1115, "step": 17285 }, { "epoch": 0.52, "learning_rate": 2.453535906205799e-06, "loss": 0.9579, "step": 17286 }, { "epoch": 0.52, "learning_rate": 2.4532920285108745e-06, "loss": 1.1698, "step": 17287 }, { "epoch": 0.52, "learning_rate": 2.4530481512605883e-06, "loss": 1.1707, "step": 17288 }, { "epoch": 0.52, "learning_rate": 2.45280427445726e-06, "loss": 1.0921, "step": 17289 }, { "epoch": 0.52, "learning_rate": 2.4525603981032124e-06, "loss": 1.1096, "step": 17290 }, { "epoch": 0.52, "learning_rate": 2.4523165222007674e-06, "loss": 1.1598, "step": 17291 }, { "epoch": 0.52, "learning_rate": 2.4520726467522456e-06, "loss": 1.0413, "step": 17292 }, { "epoch": 0.52, "learning_rate": 2.4518287717599697e-06, "loss": 1.0361, "step": 17293 }, { "epoch": 0.52, "learning_rate": 2.4515848972262604e-06, "loss": 1.0422, "step": 17294 }, { "epoch": 0.52, "learning_rate": 2.451341023153439e-06, "loss": 1.1021, "step": 17295 }, { "epoch": 0.52, "learning_rate": 2.451097149543829e-06, "loss": 1.1716, "step": 17296 }, { "epoch": 0.52, "learning_rate": 2.45085327639975e-06, "loss": 1.0779, "step": 17297 }, { "epoch": 0.52, "learning_rate": 2.450609403723524e-06, "loss": 1.1238, "step": 17298 }, { "epoch": 0.52, "learning_rate": 2.450365531517472e-06, "loss": 1.0933, "step": 17299 }, { "epoch": 0.52, "learning_rate": 2.450121659783917e-06, "loss": 1.1801, "step": 17300 }, { "epoch": 0.52, "learning_rate": 2.4498777885251807e-06, "loss": 1.0212, "step": 17301 }, { "epoch": 0.52, "learning_rate": 2.449633917743582e-06, "loss": 1.1025, "step": 17302 }, { "epoch": 0.52, "learning_rate": 2.449390047441445e-06, "loss": 1.077, "step": 17303 }, { "epoch": 0.52, "learning_rate": 2.44914617762109e-06, "loss": 1.1026, "step": 17304 }, { "epoch": 0.52, "learning_rate": 2.448902308284839e-06, "loss": 1.1251, "step": 17305 }, { "epoch": 0.52, "learning_rate": 2.4486584394350137e-06, "loss": 1.2401, "step": 17306 }, { "epoch": 0.52, "learning_rate": 2.4484145710739356e-06, "loss": 1.1471, "step": 17307 }, { "epoch": 0.52, "learning_rate": 2.4481707032039256e-06, "loss": 1.0778, "step": 17308 }, { "epoch": 0.52, "learning_rate": 2.4479268358273046e-06, "loss": 1.1616, "step": 17309 }, { "epoch": 0.52, "learning_rate": 2.4476829689463966e-06, "loss": 1.155, "step": 17310 }, { "epoch": 0.52, "learning_rate": 2.4474391025635207e-06, "loss": 1.1069, "step": 17311 }, { "epoch": 0.52, "learning_rate": 2.447195236680999e-06, "loss": 1.0345, "step": 17312 }, { "epoch": 0.52, "learning_rate": 2.446951371301153e-06, "loss": 1.29, "step": 17313 }, { "epoch": 0.52, "learning_rate": 2.4467075064263063e-06, "loss": 1.086, "step": 17314 }, { "epoch": 0.52, "learning_rate": 2.4464636420587767e-06, "loss": 1.0287, "step": 17315 }, { "epoch": 0.52, "learning_rate": 2.4462197782008878e-06, "loss": 1.1522, "step": 17316 }, { "epoch": 0.52, "learning_rate": 2.4459759148549604e-06, "loss": 1.1884, "step": 17317 }, { "epoch": 0.52, "learning_rate": 2.4457320520233166e-06, "loss": 1.2281, "step": 17318 }, { "epoch": 0.52, "learning_rate": 2.4454881897082787e-06, "loss": 1.087, "step": 17319 }, { "epoch": 0.52, "learning_rate": 2.4452443279121654e-06, "loss": 1.066, "step": 17320 }, { "epoch": 0.52, "learning_rate": 2.4450004666373e-06, "loss": 1.161, "step": 17321 }, { "epoch": 0.52, "learning_rate": 2.4447566058860036e-06, "loss": 1.0445, "step": 17322 }, { "epoch": 0.52, "learning_rate": 2.444512745660598e-06, "loss": 1.1464, "step": 17323 }, { "epoch": 0.52, "learning_rate": 2.4442688859634044e-06, "loss": 1.099, "step": 17324 }, { "epoch": 0.52, "learning_rate": 2.444025026796744e-06, "loss": 1.163, "step": 17325 }, { "epoch": 0.52, "learning_rate": 2.443781168162938e-06, "loss": 1.2062, "step": 17326 }, { "epoch": 0.52, "learning_rate": 2.4435373100643097e-06, "loss": 1.2445, "step": 17327 }, { "epoch": 0.52, "learning_rate": 2.4432934525031777e-06, "loss": 1.1158, "step": 17328 }, { "epoch": 0.52, "learning_rate": 2.443049595481865e-06, "loss": 1.1733, "step": 17329 }, { "epoch": 0.52, "learning_rate": 2.4428057390026926e-06, "loss": 1.0903, "step": 17330 }, { "epoch": 0.52, "learning_rate": 2.4425618830679816e-06, "loss": 1.1792, "step": 17331 }, { "epoch": 0.52, "learning_rate": 2.4423180276800554e-06, "loss": 1.0982, "step": 17332 }, { "epoch": 0.52, "learning_rate": 2.4420741728412327e-06, "loss": 1.0741, "step": 17333 }, { "epoch": 0.52, "learning_rate": 2.4418303185538356e-06, "loss": 1.0466, "step": 17334 }, { "epoch": 0.52, "learning_rate": 2.441586464820186e-06, "loss": 1.0801, "step": 17335 }, { "epoch": 0.52, "learning_rate": 2.4413426116426057e-06, "loss": 1.1616, "step": 17336 }, { "epoch": 0.52, "learning_rate": 2.441098759023415e-06, "loss": 1.095, "step": 17337 }, { "epoch": 0.52, "learning_rate": 2.4408549069649356e-06, "loss": 1.111, "step": 17338 }, { "epoch": 0.52, "learning_rate": 2.440611055469489e-06, "loss": 1.1277, "step": 17339 }, { "epoch": 0.52, "learning_rate": 2.440367204539398e-06, "loss": 1.0405, "step": 17340 }, { "epoch": 0.52, "learning_rate": 2.440123354176981e-06, "loss": 1.0635, "step": 17341 }, { "epoch": 0.52, "learning_rate": 2.439879504384561e-06, "loss": 1.1838, "step": 17342 }, { "epoch": 0.52, "learning_rate": 2.4396356551644592e-06, "loss": 1.0938, "step": 17343 }, { "epoch": 0.52, "learning_rate": 2.439391806518997e-06, "loss": 1.1682, "step": 17344 }, { "epoch": 0.52, "learning_rate": 2.4391479584504964e-06, "loss": 1.1335, "step": 17345 }, { "epoch": 0.52, "learning_rate": 2.4389041109612773e-06, "loss": 1.1032, "step": 17346 }, { "epoch": 0.52, "learning_rate": 2.438660264053661e-06, "loss": 1.2231, "step": 17347 }, { "epoch": 0.52, "learning_rate": 2.43841641772997e-06, "loss": 1.0873, "step": 17348 }, { "epoch": 0.52, "learning_rate": 2.438172571992525e-06, "loss": 1.1074, "step": 17349 }, { "epoch": 0.52, "learning_rate": 2.4379287268436476e-06, "loss": 1.1044, "step": 17350 }, { "epoch": 0.52, "learning_rate": 2.4376848822856584e-06, "loss": 1.1715, "step": 17351 }, { "epoch": 0.52, "learning_rate": 2.4374410383208787e-06, "loss": 1.1509, "step": 17352 }, { "epoch": 0.52, "learning_rate": 2.4371971949516317e-06, "loss": 1.0618, "step": 17353 }, { "epoch": 0.52, "learning_rate": 2.4369533521802362e-06, "loss": 1.102, "step": 17354 }, { "epoch": 0.52, "learning_rate": 2.4367095100090144e-06, "loss": 1.1424, "step": 17355 }, { "epoch": 0.52, "learning_rate": 2.436465668440287e-06, "loss": 1.1508, "step": 17356 }, { "epoch": 0.52, "learning_rate": 2.4362218274763766e-06, "loss": 1.1642, "step": 17357 }, { "epoch": 0.52, "learning_rate": 2.4359779871196044e-06, "loss": 1.0804, "step": 17358 }, { "epoch": 0.52, "learning_rate": 2.4357341473722897e-06, "loss": 1.0837, "step": 17359 }, { "epoch": 0.52, "learning_rate": 2.4354903082367552e-06, "loss": 1.1935, "step": 17360 }, { "epoch": 0.52, "learning_rate": 2.4352464697153218e-06, "loss": 1.0364, "step": 17361 }, { "epoch": 0.52, "learning_rate": 2.4350026318103114e-06, "loss": 1.2379, "step": 17362 }, { "epoch": 0.52, "learning_rate": 2.4347587945240442e-06, "loss": 1.0444, "step": 17363 }, { "epoch": 0.52, "learning_rate": 2.4345149578588415e-06, "loss": 1.2028, "step": 17364 }, { "epoch": 0.52, "learning_rate": 2.4342711218170254e-06, "loss": 1.1251, "step": 17365 }, { "epoch": 0.52, "learning_rate": 2.434027286400917e-06, "loss": 1.0898, "step": 17366 }, { "epoch": 0.52, "learning_rate": 2.4337834516128365e-06, "loss": 1.1364, "step": 17367 }, { "epoch": 0.52, "learning_rate": 2.433539617455106e-06, "loss": 1.0677, "step": 17368 }, { "epoch": 0.52, "learning_rate": 2.4332957839300457e-06, "loss": 1.1265, "step": 17369 }, { "epoch": 0.52, "learning_rate": 2.4330519510399773e-06, "loss": 1.1703, "step": 17370 }, { "epoch": 0.52, "learning_rate": 2.4328081187872234e-06, "loss": 1.0226, "step": 17371 }, { "epoch": 0.52, "learning_rate": 2.432564287174103e-06, "loss": 1.0934, "step": 17372 }, { "epoch": 0.52, "learning_rate": 2.4323204562029377e-06, "loss": 1.1418, "step": 17373 }, { "epoch": 0.52, "learning_rate": 2.4320766258760495e-06, "loss": 0.9184, "step": 17374 }, { "epoch": 0.52, "learning_rate": 2.4318327961957596e-06, "loss": 1.0257, "step": 17375 }, { "epoch": 0.52, "learning_rate": 2.4315889671643875e-06, "loss": 1.063, "step": 17376 }, { "epoch": 0.52, "learning_rate": 2.431345138784256e-06, "loss": 1.0997, "step": 17377 }, { "epoch": 0.52, "learning_rate": 2.4311013110576856e-06, "loss": 1.1418, "step": 17378 }, { "epoch": 0.52, "learning_rate": 2.4308574839869987e-06, "loss": 1.1218, "step": 17379 }, { "epoch": 0.52, "learning_rate": 2.430613657574514e-06, "loss": 1.0237, "step": 17380 }, { "epoch": 0.52, "learning_rate": 2.430369831822554e-06, "loss": 1.2993, "step": 17381 }, { "epoch": 0.52, "learning_rate": 2.4301260067334394e-06, "loss": 1.1178, "step": 17382 }, { "epoch": 0.52, "learning_rate": 2.429882182309492e-06, "loss": 1.1428, "step": 17383 }, { "epoch": 0.52, "learning_rate": 2.4296383585530333e-06, "loss": 1.0132, "step": 17384 }, { "epoch": 0.52, "learning_rate": 2.4293945354663824e-06, "loss": 1.2723, "step": 17385 }, { "epoch": 0.52, "learning_rate": 2.4291507130518615e-06, "loss": 1.0999, "step": 17386 }, { "epoch": 0.52, "learning_rate": 2.428906891311792e-06, "loss": 1.1902, "step": 17387 }, { "epoch": 0.52, "learning_rate": 2.428663070248495e-06, "loss": 1.1511, "step": 17388 }, { "epoch": 0.52, "learning_rate": 2.4284192498642906e-06, "loss": 1.0613, "step": 17389 }, { "epoch": 0.52, "learning_rate": 2.428175430161501e-06, "loss": 1.0453, "step": 17390 }, { "epoch": 0.52, "learning_rate": 2.4279316111424465e-06, "loss": 1.0773, "step": 17391 }, { "epoch": 0.52, "learning_rate": 2.4276877928094482e-06, "loss": 1.1039, "step": 17392 }, { "epoch": 0.52, "learning_rate": 2.4274439751648273e-06, "loss": 1.1191, "step": 17393 }, { "epoch": 0.52, "learning_rate": 2.4272001582109046e-06, "loss": 1.1356, "step": 17394 }, { "epoch": 0.52, "learning_rate": 2.426956341950002e-06, "loss": 1.2911, "step": 17395 }, { "epoch": 0.52, "learning_rate": 2.426712526384439e-06, "loss": 1.1956, "step": 17396 }, { "epoch": 0.52, "learning_rate": 2.4264687115165386e-06, "loss": 1.1131, "step": 17397 }, { "epoch": 0.52, "learning_rate": 2.42622489734862e-06, "loss": 1.1111, "step": 17398 }, { "epoch": 0.52, "learning_rate": 2.4259810838830046e-06, "loss": 1.1431, "step": 17399 }, { "epoch": 0.52, "learning_rate": 2.4257372711220135e-06, "loss": 1.0328, "step": 17400 }, { "epoch": 0.52, "learning_rate": 2.425493459067969e-06, "loss": 1.2417, "step": 17401 }, { "epoch": 0.52, "learning_rate": 2.42524964772319e-06, "loss": 1.1766, "step": 17402 }, { "epoch": 0.52, "learning_rate": 2.425005837089998e-06, "loss": 1.1356, "step": 17403 }, { "epoch": 0.52, "learning_rate": 2.4247620271707145e-06, "loss": 1.0797, "step": 17404 }, { "epoch": 0.52, "learning_rate": 2.424518217967661e-06, "loss": 1.16, "step": 17405 }, { "epoch": 0.52, "learning_rate": 2.424274409483157e-06, "loss": 1.1111, "step": 17406 }, { "epoch": 0.52, "learning_rate": 2.4240306017195244e-06, "loss": 1.0643, "step": 17407 }, { "epoch": 0.52, "learning_rate": 2.4237867946790834e-06, "loss": 1.1038, "step": 17408 }, { "epoch": 0.52, "learning_rate": 2.423542988364156e-06, "loss": 1.075, "step": 17409 }, { "epoch": 0.52, "learning_rate": 2.423299182777063e-06, "loss": 1.0884, "step": 17410 }, { "epoch": 0.52, "learning_rate": 2.423055377920124e-06, "loss": 1.1324, "step": 17411 }, { "epoch": 0.52, "learning_rate": 2.4228115737956607e-06, "loss": 1.1776, "step": 17412 }, { "epoch": 0.52, "learning_rate": 2.422567770405994e-06, "loss": 1.1614, "step": 17413 }, { "epoch": 0.52, "learning_rate": 2.422323967753446e-06, "loss": 1.1707, "step": 17414 }, { "epoch": 0.52, "learning_rate": 2.4220801658403355e-06, "loss": 1.0814, "step": 17415 }, { "epoch": 0.52, "learning_rate": 2.4218363646689837e-06, "loss": 1.1228, "step": 17416 }, { "epoch": 0.52, "learning_rate": 2.4215925642417127e-06, "loss": 1.2969, "step": 17417 }, { "epoch": 0.52, "learning_rate": 2.421348764560843e-06, "loss": 1.1642, "step": 17418 }, { "epoch": 0.52, "learning_rate": 2.4211049656286946e-06, "loss": 1.17, "step": 17419 }, { "epoch": 0.52, "learning_rate": 2.420861167447589e-06, "loss": 1.1615, "step": 17420 }, { "epoch": 0.52, "learning_rate": 2.420617370019847e-06, "loss": 1.147, "step": 17421 }, { "epoch": 0.52, "learning_rate": 2.4203735733477895e-06, "loss": 1.0044, "step": 17422 }, { "epoch": 0.52, "learning_rate": 2.4201297774337383e-06, "loss": 1.1688, "step": 17423 }, { "epoch": 0.52, "learning_rate": 2.419885982280012e-06, "loss": 1.1048, "step": 17424 }, { "epoch": 0.52, "learning_rate": 2.4196421878889326e-06, "loss": 1.0852, "step": 17425 }, { "epoch": 0.52, "learning_rate": 2.4193983942628207e-06, "loss": 1.1484, "step": 17426 }, { "epoch": 0.52, "learning_rate": 2.4191546014039983e-06, "loss": 1.0784, "step": 17427 }, { "epoch": 0.53, "learning_rate": 2.4189108093147845e-06, "loss": 1.1846, "step": 17428 }, { "epoch": 0.53, "learning_rate": 2.4186670179975006e-06, "loss": 1.0857, "step": 17429 }, { "epoch": 0.53, "learning_rate": 2.418423227454467e-06, "loss": 1.143, "step": 17430 }, { "epoch": 0.53, "learning_rate": 2.418179437688006e-06, "loss": 1.1942, "step": 17431 }, { "epoch": 0.53, "learning_rate": 2.417935648700437e-06, "loss": 1.0575, "step": 17432 }, { "epoch": 0.53, "learning_rate": 2.417691860494081e-06, "loss": 1.0748, "step": 17433 }, { "epoch": 0.53, "learning_rate": 2.4174480730712585e-06, "loss": 1.1414, "step": 17434 }, { "epoch": 0.53, "learning_rate": 2.4172042864342907e-06, "loss": 1.1329, "step": 17435 }, { "epoch": 0.53, "learning_rate": 2.4169605005854994e-06, "loss": 1.1841, "step": 17436 }, { "epoch": 0.53, "learning_rate": 2.4167167155272033e-06, "loss": 1.1453, "step": 17437 }, { "epoch": 0.53, "learning_rate": 2.4164729312617237e-06, "loss": 1.1033, "step": 17438 }, { "epoch": 0.53, "learning_rate": 2.4162291477913814e-06, "loss": 1.1855, "step": 17439 }, { "epoch": 0.53, "learning_rate": 2.415985365118498e-06, "loss": 1.0881, "step": 17440 }, { "epoch": 0.53, "learning_rate": 2.4157415832453933e-06, "loss": 1.1017, "step": 17441 }, { "epoch": 0.53, "learning_rate": 2.415497802174388e-06, "loss": 1.1093, "step": 17442 }, { "epoch": 0.53, "learning_rate": 2.4152540219078024e-06, "loss": 1.0181, "step": 17443 }, { "epoch": 0.53, "learning_rate": 2.4150102424479583e-06, "loss": 1.0013, "step": 17444 }, { "epoch": 0.53, "learning_rate": 2.414766463797176e-06, "loss": 1.0403, "step": 17445 }, { "epoch": 0.53, "learning_rate": 2.414522685957775e-06, "loss": 1.0927, "step": 17446 }, { "epoch": 0.53, "learning_rate": 2.4142789089320772e-06, "loss": 1.0462, "step": 17447 }, { "epoch": 0.53, "learning_rate": 2.414035132722403e-06, "loss": 1.1883, "step": 17448 }, { "epoch": 0.53, "learning_rate": 2.413791357331074e-06, "loss": 1.1961, "step": 17449 }, { "epoch": 0.53, "learning_rate": 2.413547582760408e-06, "loss": 1.1718, "step": 17450 }, { "epoch": 0.53, "learning_rate": 2.4133038090127284e-06, "loss": 1.0242, "step": 17451 }, { "epoch": 0.53, "learning_rate": 2.413060036090354e-06, "loss": 1.0992, "step": 17452 }, { "epoch": 0.53, "learning_rate": 2.412816263995608e-06, "loss": 1.1988, "step": 17453 }, { "epoch": 0.53, "learning_rate": 2.4125724927308075e-06, "loss": 1.0688, "step": 17454 }, { "epoch": 0.53, "learning_rate": 2.412328722298275e-06, "loss": 1.144, "step": 17455 }, { "epoch": 0.53, "learning_rate": 2.412084952700331e-06, "loss": 1.0884, "step": 17456 }, { "epoch": 0.53, "learning_rate": 2.411841183939296e-06, "loss": 1.046, "step": 17457 }, { "epoch": 0.53, "learning_rate": 2.4115974160174902e-06, "loss": 1.2361, "step": 17458 }, { "epoch": 0.53, "learning_rate": 2.4113536489372347e-06, "loss": 1.0396, "step": 17459 }, { "epoch": 0.53, "learning_rate": 2.4111098827008496e-06, "loss": 1.1365, "step": 17460 }, { "epoch": 0.53, "learning_rate": 2.4108661173106556e-06, "loss": 1.085, "step": 17461 }, { "epoch": 0.53, "learning_rate": 2.410622352768974e-06, "loss": 1.1463, "step": 17462 }, { "epoch": 0.53, "learning_rate": 2.4103785890781235e-06, "loss": 1.1874, "step": 17463 }, { "epoch": 0.53, "learning_rate": 2.410134826240426e-06, "loss": 1.2095, "step": 17464 }, { "epoch": 0.53, "learning_rate": 2.4098910642582012e-06, "loss": 1.1809, "step": 17465 }, { "epoch": 0.53, "learning_rate": 2.409647303133772e-06, "loss": 1.0571, "step": 17466 }, { "epoch": 0.53, "learning_rate": 2.4094035428694553e-06, "loss": 1.3047, "step": 17467 }, { "epoch": 0.53, "learning_rate": 2.4091597834675733e-06, "loss": 1.0571, "step": 17468 }, { "epoch": 0.53, "learning_rate": 2.4089160249304462e-06, "loss": 1.1541, "step": 17469 }, { "epoch": 0.53, "learning_rate": 2.4086722672603955e-06, "loss": 1.1536, "step": 17470 }, { "epoch": 0.53, "learning_rate": 2.4084285104597402e-06, "loss": 1.0436, "step": 17471 }, { "epoch": 0.53, "learning_rate": 2.4081847545308017e-06, "loss": 1.0541, "step": 17472 }, { "epoch": 0.53, "learning_rate": 2.4079409994759e-06, "loss": 1.1071, "step": 17473 }, { "epoch": 0.53, "learning_rate": 2.407697245297356e-06, "loss": 1.098, "step": 17474 }, { "epoch": 0.53, "learning_rate": 2.407453491997489e-06, "loss": 1.1298, "step": 17475 }, { "epoch": 0.53, "learning_rate": 2.4072097395786208e-06, "loss": 1.0653, "step": 17476 }, { "epoch": 0.53, "learning_rate": 2.4069659880430702e-06, "loss": 1.0365, "step": 17477 }, { "epoch": 0.53, "learning_rate": 2.4067222373931595e-06, "loss": 1.1666, "step": 17478 }, { "epoch": 0.53, "learning_rate": 2.4064784876312087e-06, "loss": 1.1037, "step": 17479 }, { "epoch": 0.53, "learning_rate": 2.406234738759537e-06, "loss": 1.2514, "step": 17480 }, { "epoch": 0.53, "learning_rate": 2.4059909907804655e-06, "loss": 1.1107, "step": 17481 }, { "epoch": 0.53, "learning_rate": 2.405747243696314e-06, "loss": 1.1612, "step": 17482 }, { "epoch": 0.53, "learning_rate": 2.4055034975094047e-06, "loss": 1.1406, "step": 17483 }, { "epoch": 0.53, "learning_rate": 2.4052597522220554e-06, "loss": 1.1508, "step": 17484 }, { "epoch": 0.53, "learning_rate": 2.4050160078365878e-06, "loss": 1.03, "step": 17485 }, { "epoch": 0.53, "learning_rate": 2.404772264355322e-06, "loss": 1.3003, "step": 17486 }, { "epoch": 0.53, "learning_rate": 2.404528521780579e-06, "loss": 1.2161, "step": 17487 }, { "epoch": 0.53, "learning_rate": 2.4042847801146775e-06, "loss": 1.1579, "step": 17488 }, { "epoch": 0.53, "learning_rate": 2.404041039359939e-06, "loss": 1.1448, "step": 17489 }, { "epoch": 0.53, "learning_rate": 2.403797299518684e-06, "loss": 1.137, "step": 17490 }, { "epoch": 0.53, "learning_rate": 2.403553560593232e-06, "loss": 1.1056, "step": 17491 }, { "epoch": 0.53, "learning_rate": 2.403309822585905e-06, "loss": 1.149, "step": 17492 }, { "epoch": 0.53, "learning_rate": 2.4030660854990206e-06, "loss": 1.185, "step": 17493 }, { "epoch": 0.53, "learning_rate": 2.4028223493349005e-06, "loss": 1.1241, "step": 17494 }, { "epoch": 0.53, "learning_rate": 2.402578614095865e-06, "loss": 1.1036, "step": 17495 }, { "epoch": 0.53, "learning_rate": 2.402334879784235e-06, "loss": 1.1577, "step": 17496 }, { "epoch": 0.53, "learning_rate": 2.4020911464023285e-06, "loss": 1.1218, "step": 17497 }, { "epoch": 0.53, "learning_rate": 2.4018474139524678e-06, "loss": 1.1126, "step": 17498 }, { "epoch": 0.53, "learning_rate": 2.401603682436972e-06, "loss": 1.1157, "step": 17499 }, { "epoch": 0.53, "learning_rate": 2.4013599518581626e-06, "loss": 1.1514, "step": 17500 }, { "epoch": 0.53, "learning_rate": 2.4011162222183583e-06, "loss": 1.0945, "step": 17501 }, { "epoch": 0.53, "learning_rate": 2.4008724935198794e-06, "loss": 1.0563, "step": 17502 }, { "epoch": 0.53, "learning_rate": 2.4006287657650473e-06, "loss": 1.1799, "step": 17503 }, { "epoch": 0.53, "learning_rate": 2.4003850389561813e-06, "loss": 1.1461, "step": 17504 }, { "epoch": 0.53, "learning_rate": 2.400141313095603e-06, "loss": 1.2092, "step": 17505 }, { "epoch": 0.53, "learning_rate": 2.39989758818563e-06, "loss": 1.0872, "step": 17506 }, { "epoch": 0.53, "learning_rate": 2.3996538642285837e-06, "loss": 1.136, "step": 17507 }, { "epoch": 0.53, "learning_rate": 2.3994101412267847e-06, "loss": 1.097, "step": 17508 }, { "epoch": 0.53, "learning_rate": 2.3991664191825535e-06, "loss": 1.1231, "step": 17509 }, { "epoch": 0.53, "learning_rate": 2.398922698098208e-06, "loss": 1.187, "step": 17510 }, { "epoch": 0.53, "learning_rate": 2.3986789779760702e-06, "loss": 1.1123, "step": 17511 }, { "epoch": 0.53, "learning_rate": 2.3984352588184595e-06, "loss": 1.1597, "step": 17512 }, { "epoch": 0.53, "learning_rate": 2.398191540627697e-06, "loss": 1.0622, "step": 17513 }, { "epoch": 0.53, "learning_rate": 2.3979478234061014e-06, "loss": 1.0998, "step": 17514 }, { "epoch": 0.53, "learning_rate": 2.397704107155993e-06, "loss": 1.1529, "step": 17515 }, { "epoch": 0.53, "learning_rate": 2.3974603918796928e-06, "loss": 1.0825, "step": 17516 }, { "epoch": 0.53, "learning_rate": 2.39721667757952e-06, "loss": 1.2434, "step": 17517 }, { "epoch": 0.53, "learning_rate": 2.396972964257796e-06, "loss": 1.1719, "step": 17518 }, { "epoch": 0.53, "learning_rate": 2.396729251916839e-06, "loss": 1.3412, "step": 17519 }, { "epoch": 0.53, "learning_rate": 2.3964855405589692e-06, "loss": 1.101, "step": 17520 }, { "epoch": 0.53, "learning_rate": 2.3962418301865073e-06, "loss": 1.0184, "step": 17521 }, { "epoch": 0.53, "learning_rate": 2.3959981208017747e-06, "loss": 1.1516, "step": 17522 }, { "epoch": 0.53, "learning_rate": 2.3957544124070885e-06, "loss": 1.2139, "step": 17523 }, { "epoch": 0.53, "learning_rate": 2.39551070500477e-06, "loss": 1.0786, "step": 17524 }, { "epoch": 0.53, "learning_rate": 2.3952669985971393e-06, "loss": 1.2545, "step": 17525 }, { "epoch": 0.53, "learning_rate": 2.395023293186517e-06, "loss": 1.1326, "step": 17526 }, { "epoch": 0.53, "learning_rate": 2.394779588775222e-06, "loss": 1.0791, "step": 17527 }, { "epoch": 0.53, "learning_rate": 2.3945358853655745e-06, "loss": 1.117, "step": 17528 }, { "epoch": 0.53, "learning_rate": 2.394292182959895e-06, "loss": 1.194, "step": 17529 }, { "epoch": 0.53, "learning_rate": 2.3940484815605023e-06, "loss": 1.2418, "step": 17530 }, { "epoch": 0.53, "learning_rate": 2.3938047811697184e-06, "loss": 1.0992, "step": 17531 }, { "epoch": 0.53, "learning_rate": 2.3935610817898608e-06, "loss": 1.2571, "step": 17532 }, { "epoch": 0.53, "learning_rate": 2.39331738342325e-06, "loss": 1.1228, "step": 17533 }, { "epoch": 0.53, "learning_rate": 2.393073686072207e-06, "loss": 1.1677, "step": 17534 }, { "epoch": 0.53, "learning_rate": 2.392829989739052e-06, "loss": 1.1212, "step": 17535 }, { "epoch": 0.53, "learning_rate": 2.3925862944261023e-06, "loss": 1.1574, "step": 17536 }, { "epoch": 0.53, "learning_rate": 2.3923426001356798e-06, "loss": 1.1441, "step": 17537 }, { "epoch": 0.53, "learning_rate": 2.3920989068701036e-06, "loss": 1.1611, "step": 17538 }, { "epoch": 0.53, "learning_rate": 2.3918552146316946e-06, "loss": 1.1274, "step": 17539 }, { "epoch": 0.53, "learning_rate": 2.391611523422771e-06, "loss": 1.008, "step": 17540 }, { "epoch": 0.53, "learning_rate": 2.391367833245654e-06, "loss": 1.0817, "step": 17541 }, { "epoch": 0.53, "learning_rate": 2.3911241441026627e-06, "loss": 1.194, "step": 17542 }, { "epoch": 0.53, "learning_rate": 2.3908804559961177e-06, "loss": 1.1248, "step": 17543 }, { "epoch": 0.53, "learning_rate": 2.390636768928338e-06, "loss": 1.1419, "step": 17544 }, { "epoch": 0.53, "learning_rate": 2.3903930829016434e-06, "loss": 1.1488, "step": 17545 }, { "epoch": 0.53, "learning_rate": 2.3901493979183537e-06, "loss": 1.0516, "step": 17546 }, { "epoch": 0.53, "learning_rate": 2.3899057139807884e-06, "loss": 1.1107, "step": 17547 }, { "epoch": 0.53, "learning_rate": 2.3896620310912693e-06, "loss": 1.0805, "step": 17548 }, { "epoch": 0.53, "learning_rate": 2.3894183492521133e-06, "loss": 1.1737, "step": 17549 }, { "epoch": 0.53, "learning_rate": 2.3891746684656415e-06, "loss": 1.0006, "step": 17550 }, { "epoch": 0.53, "learning_rate": 2.388930988734173e-06, "loss": 1.2317, "step": 17551 }, { "epoch": 0.53, "learning_rate": 2.388687310060029e-06, "loss": 1.019, "step": 17552 }, { "epoch": 0.53, "learning_rate": 2.3884436324455272e-06, "loss": 1.2075, "step": 17553 }, { "epoch": 0.53, "learning_rate": 2.3881999558929894e-06, "loss": 1.0847, "step": 17554 }, { "epoch": 0.53, "learning_rate": 2.387956280404733e-06, "loss": 1.2036, "step": 17555 }, { "epoch": 0.53, "learning_rate": 2.3877126059830795e-06, "loss": 0.9817, "step": 17556 }, { "epoch": 0.53, "learning_rate": 2.3874689326303483e-06, "loss": 1.1559, "step": 17557 }, { "epoch": 0.53, "learning_rate": 2.387225260348858e-06, "loss": 1.0738, "step": 17558 }, { "epoch": 0.53, "learning_rate": 2.3869815891409287e-06, "loss": 1.0724, "step": 17559 }, { "epoch": 0.53, "learning_rate": 2.3867379190088803e-06, "loss": 1.1315, "step": 17560 }, { "epoch": 0.53, "learning_rate": 2.386494249955034e-06, "loss": 1.1295, "step": 17561 }, { "epoch": 0.53, "learning_rate": 2.3862505819817062e-06, "loss": 1.203, "step": 17562 }, { "epoch": 0.53, "learning_rate": 2.386006915091218e-06, "loss": 1.1284, "step": 17563 }, { "epoch": 0.53, "learning_rate": 2.3857632492858894e-06, "loss": 1.0862, "step": 17564 }, { "epoch": 0.53, "learning_rate": 2.3855195845680404e-06, "loss": 1.1348, "step": 17565 }, { "epoch": 0.53, "learning_rate": 2.385275920939989e-06, "loss": 1.0286, "step": 17566 }, { "epoch": 0.53, "learning_rate": 2.3850322584040554e-06, "loss": 1.029, "step": 17567 }, { "epoch": 0.53, "learning_rate": 2.384788596962559e-06, "loss": 1.2325, "step": 17568 }, { "epoch": 0.53, "learning_rate": 2.38454493661782e-06, "loss": 1.0407, "step": 17569 }, { "epoch": 0.53, "learning_rate": 2.3843012773721584e-06, "loss": 1.1835, "step": 17570 }, { "epoch": 0.53, "learning_rate": 2.3840576192278924e-06, "loss": 1.0495, "step": 17571 }, { "epoch": 0.53, "learning_rate": 2.3838139621873416e-06, "loss": 1.0914, "step": 17572 }, { "epoch": 0.53, "learning_rate": 2.383570306252826e-06, "loss": 1.1352, "step": 17573 }, { "epoch": 0.53, "learning_rate": 2.3833266514266665e-06, "loss": 1.0275, "step": 17574 }, { "epoch": 0.53, "learning_rate": 2.3830829977111796e-06, "loss": 1.2062, "step": 17575 }, { "epoch": 0.53, "learning_rate": 2.3828393451086864e-06, "loss": 1.1512, "step": 17576 }, { "epoch": 0.53, "learning_rate": 2.3825956936215064e-06, "loss": 1.1555, "step": 17577 }, { "epoch": 0.53, "learning_rate": 2.3823520432519593e-06, "loss": 1.1034, "step": 17578 }, { "epoch": 0.53, "learning_rate": 2.382108394002364e-06, "loss": 0.9765, "step": 17579 }, { "epoch": 0.53, "learning_rate": 2.381864745875039e-06, "loss": 1.2057, "step": 17580 }, { "epoch": 0.53, "learning_rate": 2.3816210988723053e-06, "loss": 1.0067, "step": 17581 }, { "epoch": 0.53, "learning_rate": 2.381377452996482e-06, "loss": 1.0598, "step": 17582 }, { "epoch": 0.53, "learning_rate": 2.381133808249888e-06, "loss": 1.1963, "step": 17583 }, { "epoch": 0.53, "learning_rate": 2.3808901646348426e-06, "loss": 1.1419, "step": 17584 }, { "epoch": 0.53, "learning_rate": 2.3806465221536654e-06, "loss": 1.1872, "step": 17585 }, { "epoch": 0.53, "learning_rate": 2.3804028808086763e-06, "loss": 1.175, "step": 17586 }, { "epoch": 0.53, "learning_rate": 2.3801592406021947e-06, "loss": 1.252, "step": 17587 }, { "epoch": 0.53, "learning_rate": 2.3799156015365386e-06, "loss": 1.1218, "step": 17588 }, { "epoch": 0.53, "learning_rate": 2.379671963614028e-06, "loss": 0.9729, "step": 17589 }, { "epoch": 0.53, "learning_rate": 2.3794283268369826e-06, "loss": 1.1866, "step": 17590 }, { "epoch": 0.53, "learning_rate": 2.379184691207722e-06, "loss": 1.1141, "step": 17591 }, { "epoch": 0.53, "learning_rate": 2.378941056728565e-06, "loss": 1.0474, "step": 17592 }, { "epoch": 0.53, "learning_rate": 2.3786974234018297e-06, "loss": 1.1773, "step": 17593 }, { "epoch": 0.53, "learning_rate": 2.3784537912298373e-06, "loss": 1.0433, "step": 17594 }, { "epoch": 0.53, "learning_rate": 2.3782101602149058e-06, "loss": 1.0385, "step": 17595 }, { "epoch": 0.53, "learning_rate": 2.3779665303593553e-06, "loss": 1.1609, "step": 17596 }, { "epoch": 0.53, "learning_rate": 2.3777229016655045e-06, "loss": 1.1738, "step": 17597 }, { "epoch": 0.53, "learning_rate": 2.3774792741356728e-06, "loss": 1.0848, "step": 17598 }, { "epoch": 0.53, "learning_rate": 2.377235647772179e-06, "loss": 1.1689, "step": 17599 }, { "epoch": 0.53, "learning_rate": 2.376992022577344e-06, "loss": 1.0599, "step": 17600 }, { "epoch": 0.53, "learning_rate": 2.376748398553485e-06, "loss": 1.1754, "step": 17601 }, { "epoch": 0.53, "learning_rate": 2.3765047757029214e-06, "loss": 1.1278, "step": 17602 }, { "epoch": 0.53, "learning_rate": 2.376261154027973e-06, "loss": 1.144, "step": 17603 }, { "epoch": 0.53, "learning_rate": 2.37601753353096e-06, "loss": 1.2076, "step": 17604 }, { "epoch": 0.53, "learning_rate": 2.375773914214199e-06, "loss": 1.1058, "step": 17605 }, { "epoch": 0.53, "learning_rate": 2.375530296080011e-06, "loss": 1.0732, "step": 17606 }, { "epoch": 0.53, "learning_rate": 2.375286679130714e-06, "loss": 1.1516, "step": 17607 }, { "epoch": 0.53, "learning_rate": 2.3750430633686285e-06, "loss": 1.0702, "step": 17608 }, { "epoch": 0.53, "learning_rate": 2.3747994487960727e-06, "loss": 1.0953, "step": 17609 }, { "epoch": 0.53, "learning_rate": 2.3745558354153656e-06, "loss": 1.2019, "step": 17610 }, { "epoch": 0.53, "learning_rate": 2.3743122232288266e-06, "loss": 1.1728, "step": 17611 }, { "epoch": 0.53, "learning_rate": 2.3740686122387747e-06, "loss": 1.2184, "step": 17612 }, { "epoch": 0.53, "learning_rate": 2.3738250024475297e-06, "loss": 1.1418, "step": 17613 }, { "epoch": 0.53, "learning_rate": 2.3735813938574093e-06, "loss": 1.1509, "step": 17614 }, { "epoch": 0.53, "learning_rate": 2.373337786470733e-06, "loss": 1.0472, "step": 17615 }, { "epoch": 0.53, "learning_rate": 2.3730941802898198e-06, "loss": 1.1208, "step": 17616 }, { "epoch": 0.53, "learning_rate": 2.37285057531699e-06, "loss": 1.0867, "step": 17617 }, { "epoch": 0.53, "learning_rate": 2.372606971554561e-06, "loss": 1.1816, "step": 17618 }, { "epoch": 0.53, "learning_rate": 2.3723633690048513e-06, "loss": 1.1145, "step": 17619 }, { "epoch": 0.53, "learning_rate": 2.3721197676701817e-06, "loss": 1.1307, "step": 17620 }, { "epoch": 0.53, "learning_rate": 2.3718761675528696e-06, "loss": 1.0723, "step": 17621 }, { "epoch": 0.53, "learning_rate": 2.3716325686552353e-06, "loss": 1.0707, "step": 17622 }, { "epoch": 0.53, "learning_rate": 2.371388970979597e-06, "loss": 1.1075, "step": 17623 }, { "epoch": 0.53, "learning_rate": 2.371145374528274e-06, "loss": 1.1747, "step": 17624 }, { "epoch": 0.53, "learning_rate": 2.3709017793035845e-06, "loss": 1.0797, "step": 17625 }, { "epoch": 0.53, "learning_rate": 2.370658185307849e-06, "loss": 1.1582, "step": 17626 }, { "epoch": 0.53, "learning_rate": 2.370414592543384e-06, "loss": 1.0795, "step": 17627 }, { "epoch": 0.53, "learning_rate": 2.37017100101251e-06, "loss": 1.1127, "step": 17628 }, { "epoch": 0.53, "learning_rate": 2.3699274107175454e-06, "loss": 1.0408, "step": 17629 }, { "epoch": 0.53, "learning_rate": 2.3696838216608102e-06, "loss": 1.2205, "step": 17630 }, { "epoch": 0.53, "learning_rate": 2.3694402338446217e-06, "loss": 1.2086, "step": 17631 }, { "epoch": 0.53, "learning_rate": 2.3691966472712986e-06, "loss": 1.1552, "step": 17632 }, { "epoch": 0.53, "learning_rate": 2.368953061943161e-06, "loss": 1.1519, "step": 17633 }, { "epoch": 0.53, "learning_rate": 2.3687094778625267e-06, "loss": 1.0887, "step": 17634 }, { "epoch": 0.53, "learning_rate": 2.368465895031716e-06, "loss": 1.033, "step": 17635 }, { "epoch": 0.53, "learning_rate": 2.3682223134530457e-06, "loss": 1.022, "step": 17636 }, { "epoch": 0.53, "learning_rate": 2.3679787331288357e-06, "loss": 1.1217, "step": 17637 }, { "epoch": 0.53, "learning_rate": 2.3677351540614044e-06, "loss": 1.142, "step": 17638 }, { "epoch": 0.53, "learning_rate": 2.3674915762530716e-06, "loss": 1.0801, "step": 17639 }, { "epoch": 0.53, "learning_rate": 2.367247999706154e-06, "loss": 1.1133, "step": 17640 }, { "epoch": 0.53, "learning_rate": 2.3670044244229717e-06, "loss": 1.0511, "step": 17641 }, { "epoch": 0.53, "learning_rate": 2.3667608504058436e-06, "loss": 1.1578, "step": 17642 }, { "epoch": 0.53, "learning_rate": 2.3665172776570888e-06, "loss": 1.2176, "step": 17643 }, { "epoch": 0.53, "learning_rate": 2.366273706179024e-06, "loss": 1.0876, "step": 17644 }, { "epoch": 0.53, "learning_rate": 2.3660301359739698e-06, "loss": 1.0469, "step": 17645 }, { "epoch": 0.53, "learning_rate": 2.3657865670442434e-06, "loss": 0.992, "step": 17646 }, { "epoch": 0.53, "learning_rate": 2.3655429993921647e-06, "loss": 1.1516, "step": 17647 }, { "epoch": 0.53, "learning_rate": 2.365299433020053e-06, "loss": 1.1237, "step": 17648 }, { "epoch": 0.53, "learning_rate": 2.3650558679302244e-06, "loss": 1.1763, "step": 17649 }, { "epoch": 0.53, "learning_rate": 2.364812304124999e-06, "loss": 1.0018, "step": 17650 }, { "epoch": 0.53, "learning_rate": 2.3645687416066956e-06, "loss": 1.0552, "step": 17651 }, { "epoch": 0.53, "learning_rate": 2.364325180377633e-06, "loss": 1.1616, "step": 17652 }, { "epoch": 0.53, "learning_rate": 2.3640816204401287e-06, "loss": 1.2418, "step": 17653 }, { "epoch": 0.53, "learning_rate": 2.363838061796502e-06, "loss": 1.2067, "step": 17654 }, { "epoch": 0.53, "learning_rate": 2.363594504449071e-06, "loss": 1.2664, "step": 17655 }, { "epoch": 0.53, "learning_rate": 2.363350948400156e-06, "loss": 1.209, "step": 17656 }, { "epoch": 0.53, "learning_rate": 2.3631073936520734e-06, "loss": 1.144, "step": 17657 }, { "epoch": 0.53, "learning_rate": 2.3628638402071423e-06, "loss": 1.1783, "step": 17658 }, { "epoch": 0.53, "learning_rate": 2.3626202880676813e-06, "loss": 1.1355, "step": 17659 }, { "epoch": 0.53, "learning_rate": 2.3623767372360103e-06, "loss": 1.2216, "step": 17660 }, { "epoch": 0.53, "learning_rate": 2.3621331877144448e-06, "loss": 1.1909, "step": 17661 }, { "epoch": 0.53, "learning_rate": 2.3618896395053055e-06, "loss": 1.1938, "step": 17662 }, { "epoch": 0.53, "learning_rate": 2.36164609261091e-06, "loss": 1.0986, "step": 17663 }, { "epoch": 0.53, "learning_rate": 2.3614025470335776e-06, "loss": 1.1959, "step": 17664 }, { "epoch": 0.53, "learning_rate": 2.361159002775626e-06, "loss": 1.0764, "step": 17665 }, { "epoch": 0.53, "learning_rate": 2.3609154598393736e-06, "loss": 1.0317, "step": 17666 }, { "epoch": 0.53, "learning_rate": 2.360671918227139e-06, "loss": 1.174, "step": 17667 }, { "epoch": 0.53, "learning_rate": 2.360428377941241e-06, "loss": 1.1969, "step": 17668 }, { "epoch": 0.53, "learning_rate": 2.3601848389839983e-06, "loss": 1.1725, "step": 17669 }, { "epoch": 0.53, "learning_rate": 2.3599413013577277e-06, "loss": 1.0941, "step": 17670 }, { "epoch": 0.53, "learning_rate": 2.3596977650647483e-06, "loss": 1.0359, "step": 17671 }, { "epoch": 0.53, "learning_rate": 2.359454230107379e-06, "loss": 1.1547, "step": 17672 }, { "epoch": 0.53, "learning_rate": 2.3592106964879385e-06, "loss": 1.2212, "step": 17673 }, { "epoch": 0.53, "learning_rate": 2.3589671642087433e-06, "loss": 1.0464, "step": 17674 }, { "epoch": 0.53, "learning_rate": 2.3587236332721128e-06, "loss": 1.1272, "step": 17675 }, { "epoch": 0.53, "learning_rate": 2.358480103680365e-06, "loss": 1.1438, "step": 17676 }, { "epoch": 0.53, "learning_rate": 2.3582365754358187e-06, "loss": 1.0723, "step": 17677 }, { "epoch": 0.53, "learning_rate": 2.3579930485407927e-06, "loss": 1.081, "step": 17678 }, { "epoch": 0.53, "learning_rate": 2.3577495229976034e-06, "loss": 1.0726, "step": 17679 }, { "epoch": 0.53, "learning_rate": 2.3575059988085707e-06, "loss": 1.132, "step": 17680 }, { "epoch": 0.53, "learning_rate": 2.357262475976012e-06, "loss": 1.2581, "step": 17681 }, { "epoch": 0.53, "learning_rate": 2.357018954502247e-06, "loss": 1.0742, "step": 17682 }, { "epoch": 0.53, "learning_rate": 2.356775434389591e-06, "loss": 1.1098, "step": 17683 }, { "epoch": 0.53, "learning_rate": 2.3565319156403646e-06, "loss": 1.0981, "step": 17684 }, { "epoch": 0.53, "learning_rate": 2.356288398256885e-06, "loss": 1.1154, "step": 17685 }, { "epoch": 0.53, "learning_rate": 2.356044882241472e-06, "loss": 1.0662, "step": 17686 }, { "epoch": 0.53, "learning_rate": 2.3558013675964407e-06, "loss": 1.1622, "step": 17687 }, { "epoch": 0.53, "learning_rate": 2.3555578543241114e-06, "loss": 1.0373, "step": 17688 }, { "epoch": 0.53, "learning_rate": 2.355314342426802e-06, "loss": 1.1486, "step": 17689 }, { "epoch": 0.53, "learning_rate": 2.3550708319068295e-06, "loss": 1.1667, "step": 17690 }, { "epoch": 0.53, "learning_rate": 2.354827322766514e-06, "loss": 1.0435, "step": 17691 }, { "epoch": 0.53, "learning_rate": 2.354583815008172e-06, "loss": 1.1771, "step": 17692 }, { "epoch": 0.53, "learning_rate": 2.354340308634122e-06, "loss": 1.2823, "step": 17693 }, { "epoch": 0.53, "learning_rate": 2.354096803646682e-06, "loss": 1.2742, "step": 17694 }, { "epoch": 0.53, "learning_rate": 2.3538533000481712e-06, "loss": 1.0568, "step": 17695 }, { "epoch": 0.53, "learning_rate": 2.353609797840906e-06, "loss": 1.0914, "step": 17696 }, { "epoch": 0.53, "learning_rate": 2.3533662970272044e-06, "loss": 1.1129, "step": 17697 }, { "epoch": 0.53, "learning_rate": 2.353122797609385e-06, "loss": 1.0983, "step": 17698 }, { "epoch": 0.53, "learning_rate": 2.3528792995897674e-06, "loss": 1.0754, "step": 17699 }, { "epoch": 0.53, "learning_rate": 2.3526358029706665e-06, "loss": 1.1229, "step": 17700 }, { "epoch": 0.53, "learning_rate": 2.352392307754402e-06, "loss": 1.0343, "step": 17701 }, { "epoch": 0.53, "learning_rate": 2.3521488139432917e-06, "loss": 1.0056, "step": 17702 }, { "epoch": 0.53, "learning_rate": 2.3519053215396536e-06, "loss": 1.0602, "step": 17703 }, { "epoch": 0.53, "learning_rate": 2.3516618305458057e-06, "loss": 1.0366, "step": 17704 }, { "epoch": 0.53, "learning_rate": 2.3514183409640655e-06, "loss": 1.1312, "step": 17705 }, { "epoch": 0.53, "learning_rate": 2.351174852796751e-06, "loss": 1.2712, "step": 17706 }, { "epoch": 0.53, "learning_rate": 2.35093136604618e-06, "loss": 1.1349, "step": 17707 }, { "epoch": 0.53, "learning_rate": 2.350687880714672e-06, "loss": 1.1036, "step": 17708 }, { "epoch": 0.53, "learning_rate": 2.350444396804542e-06, "loss": 1.0292, "step": 17709 }, { "epoch": 0.53, "learning_rate": 2.3502009143181097e-06, "loss": 1.0749, "step": 17710 }, { "epoch": 0.53, "learning_rate": 2.3499574332576924e-06, "loss": 1.0879, "step": 17711 }, { "epoch": 0.53, "learning_rate": 2.349713953625609e-06, "loss": 1.1512, "step": 17712 }, { "epoch": 0.53, "learning_rate": 2.3494704754241757e-06, "loss": 1.0901, "step": 17713 }, { "epoch": 0.53, "learning_rate": 2.3492269986557104e-06, "loss": 1.1611, "step": 17714 }, { "epoch": 0.53, "learning_rate": 2.3489835233225323e-06, "loss": 1.1308, "step": 17715 }, { "epoch": 0.53, "learning_rate": 2.3487400494269575e-06, "loss": 1.1646, "step": 17716 }, { "epoch": 0.53, "learning_rate": 2.3484965769713057e-06, "loss": 1.2386, "step": 17717 }, { "epoch": 0.53, "learning_rate": 2.3482531059578927e-06, "loss": 1.1967, "step": 17718 }, { "epoch": 0.53, "learning_rate": 2.3480096363890376e-06, "loss": 1.1808, "step": 17719 }, { "epoch": 0.53, "learning_rate": 2.347766168267057e-06, "loss": 1.1082, "step": 17720 }, { "epoch": 0.53, "learning_rate": 2.34752270159427e-06, "loss": 1.0819, "step": 17721 }, { "epoch": 0.53, "learning_rate": 2.3472792363729922e-06, "loss": 1.0786, "step": 17722 }, { "epoch": 0.53, "learning_rate": 2.3470357726055433e-06, "loss": 1.0447, "step": 17723 }, { "epoch": 0.53, "learning_rate": 2.3467923102942397e-06, "loss": 1.0661, "step": 17724 }, { "epoch": 0.53, "learning_rate": 2.3465488494414007e-06, "loss": 1.1066, "step": 17725 }, { "epoch": 0.53, "learning_rate": 2.346305390049342e-06, "loss": 1.1354, "step": 17726 }, { "epoch": 0.53, "learning_rate": 2.3460619321203814e-06, "loss": 1.1445, "step": 17727 }, { "epoch": 0.53, "learning_rate": 2.345818475656837e-06, "loss": 1.124, "step": 17728 }, { "epoch": 0.53, "learning_rate": 2.345575020661027e-06, "loss": 1.0741, "step": 17729 }, { "epoch": 0.53, "learning_rate": 2.3453315671352695e-06, "loss": 1.157, "step": 17730 }, { "epoch": 0.53, "learning_rate": 2.3450881150818797e-06, "loss": 1.1747, "step": 17731 }, { "epoch": 0.53, "learning_rate": 2.3448446645031763e-06, "loss": 1.0806, "step": 17732 }, { "epoch": 0.53, "learning_rate": 2.3446012154014773e-06, "loss": 1.1905, "step": 17733 }, { "epoch": 0.53, "learning_rate": 2.3443577677791002e-06, "loss": 1.0507, "step": 17734 }, { "epoch": 0.53, "learning_rate": 2.3441143216383616e-06, "loss": 1.0651, "step": 17735 }, { "epoch": 0.53, "learning_rate": 2.34387087698158e-06, "loss": 1.2676, "step": 17736 }, { "epoch": 0.53, "learning_rate": 2.343627433811072e-06, "loss": 1.2244, "step": 17737 }, { "epoch": 0.53, "learning_rate": 2.3433839921291567e-06, "loss": 1.0086, "step": 17738 }, { "epoch": 0.53, "learning_rate": 2.343140551938149e-06, "loss": 1.0541, "step": 17739 }, { "epoch": 0.53, "learning_rate": 2.342897113240368e-06, "loss": 1.0024, "step": 17740 }, { "epoch": 0.53, "learning_rate": 2.342653676038131e-06, "loss": 1.0677, "step": 17741 }, { "epoch": 0.53, "learning_rate": 2.3424102403337552e-06, "loss": 1.2397, "step": 17742 }, { "epoch": 0.53, "learning_rate": 2.3421668061295586e-06, "loss": 1.3438, "step": 17743 }, { "epoch": 0.53, "learning_rate": 2.3419233734278575e-06, "loss": 1.2859, "step": 17744 }, { "epoch": 0.53, "learning_rate": 2.3416799422309696e-06, "loss": 1.2361, "step": 17745 }, { "epoch": 0.53, "learning_rate": 2.341436512541212e-06, "loss": 1.0815, "step": 17746 }, { "epoch": 0.53, "learning_rate": 2.341193084360904e-06, "loss": 1.0182, "step": 17747 }, { "epoch": 0.53, "learning_rate": 2.34094965769236e-06, "loss": 1.1594, "step": 17748 }, { "epoch": 0.53, "learning_rate": 2.3407062325378986e-06, "loss": 1.139, "step": 17749 }, { "epoch": 0.53, "learning_rate": 2.340462808899837e-06, "loss": 1.1591, "step": 17750 }, { "epoch": 0.53, "learning_rate": 2.340219386780494e-06, "loss": 1.1192, "step": 17751 }, { "epoch": 0.53, "learning_rate": 2.339975966182185e-06, "loss": 1.1324, "step": 17752 }, { "epoch": 0.53, "learning_rate": 2.339732547107227e-06, "loss": 1.0408, "step": 17753 }, { "epoch": 0.53, "learning_rate": 2.339489129557938e-06, "loss": 1.1288, "step": 17754 }, { "epoch": 0.53, "learning_rate": 2.3392457135366353e-06, "loss": 1.217, "step": 17755 }, { "epoch": 0.53, "learning_rate": 2.3390022990456372e-06, "loss": 1.1371, "step": 17756 }, { "epoch": 0.53, "learning_rate": 2.338758886087258e-06, "loss": 1.0761, "step": 17757 }, { "epoch": 0.53, "learning_rate": 2.3385154746638173e-06, "loss": 1.0597, "step": 17758 }, { "epoch": 0.53, "learning_rate": 2.338272064777631e-06, "loss": 0.9728, "step": 17759 }, { "epoch": 0.54, "learning_rate": 2.338028656431018e-06, "loss": 1.0994, "step": 17760 }, { "epoch": 0.54, "learning_rate": 2.337785249626293e-06, "loss": 1.175, "step": 17761 }, { "epoch": 0.54, "learning_rate": 2.3375418443657745e-06, "loss": 1.1479, "step": 17762 }, { "epoch": 0.54, "learning_rate": 2.337298440651779e-06, "loss": 1.1619, "step": 17763 }, { "epoch": 0.54, "learning_rate": 2.3370550384866257e-06, "loss": 1.1138, "step": 17764 }, { "epoch": 0.54, "learning_rate": 2.3368116378726286e-06, "loss": 1.1061, "step": 17765 }, { "epoch": 0.54, "learning_rate": 2.336568238812106e-06, "loss": 1.0891, "step": 17766 }, { "epoch": 0.54, "learning_rate": 2.336324841307375e-06, "loss": 1.1018, "step": 17767 }, { "epoch": 0.54, "learning_rate": 2.336081445360753e-06, "loss": 1.2016, "step": 17768 }, { "epoch": 0.54, "learning_rate": 2.3358380509745575e-06, "loss": 1.0721, "step": 17769 }, { "epoch": 0.54, "learning_rate": 2.335594658151104e-06, "loss": 1.1385, "step": 17770 }, { "epoch": 0.54, "learning_rate": 2.3353512668927098e-06, "loss": 1.1917, "step": 17771 }, { "epoch": 0.54, "learning_rate": 2.335107877201692e-06, "loss": 1.1124, "step": 17772 }, { "epoch": 0.54, "learning_rate": 2.334864489080369e-06, "loss": 1.1806, "step": 17773 }, { "epoch": 0.54, "learning_rate": 2.3346211025310555e-06, "loss": 1.1123, "step": 17774 }, { "epoch": 0.54, "learning_rate": 2.33437771755607e-06, "loss": 1.0895, "step": 17775 }, { "epoch": 0.54, "learning_rate": 2.334134334157728e-06, "loss": 1.1229, "step": 17776 }, { "epoch": 0.54, "learning_rate": 2.333890952338349e-06, "loss": 1.1307, "step": 17777 }, { "epoch": 0.54, "learning_rate": 2.333647572100247e-06, "loss": 1.1388, "step": 17778 }, { "epoch": 0.54, "learning_rate": 2.3334041934457395e-06, "loss": 1.1141, "step": 17779 }, { "epoch": 0.54, "learning_rate": 2.3331608163771445e-06, "loss": 1.2004, "step": 17780 }, { "epoch": 0.54, "learning_rate": 2.332917440896778e-06, "loss": 1.0439, "step": 17781 }, { "epoch": 0.54, "learning_rate": 2.3326740670069577e-06, "loss": 1.0172, "step": 17782 }, { "epoch": 0.54, "learning_rate": 2.3324306947099988e-06, "loss": 1.0563, "step": 17783 }, { "epoch": 0.54, "learning_rate": 2.3321873240082192e-06, "loss": 1.1443, "step": 17784 }, { "epoch": 0.54, "learning_rate": 2.3319439549039354e-06, "loss": 1.1152, "step": 17785 }, { "epoch": 0.54, "learning_rate": 2.3317005873994647e-06, "loss": 1.2224, "step": 17786 }, { "epoch": 0.54, "learning_rate": 2.3314572214971225e-06, "loss": 1.1412, "step": 17787 }, { "epoch": 0.54, "learning_rate": 2.331213857199227e-06, "loss": 1.1866, "step": 17788 }, { "epoch": 0.54, "learning_rate": 2.3309704945080937e-06, "loss": 1.155, "step": 17789 }, { "epoch": 0.54, "learning_rate": 2.330727133426041e-06, "loss": 1.0405, "step": 17790 }, { "epoch": 0.54, "learning_rate": 2.3304837739553836e-06, "loss": 1.1354, "step": 17791 }, { "epoch": 0.54, "learning_rate": 2.3302404160984394e-06, "loss": 1.018, "step": 17792 }, { "epoch": 0.54, "learning_rate": 2.329997059857524e-06, "loss": 1.3019, "step": 17793 }, { "epoch": 0.54, "learning_rate": 2.329753705234955e-06, "loss": 1.1886, "step": 17794 }, { "epoch": 0.54, "learning_rate": 2.32951035223305e-06, "loss": 1.0532, "step": 17795 }, { "epoch": 0.54, "learning_rate": 2.329267000854123e-06, "loss": 1.0341, "step": 17796 }, { "epoch": 0.54, "learning_rate": 2.329023651100492e-06, "loss": 1.2063, "step": 17797 }, { "epoch": 0.54, "learning_rate": 2.3287803029744737e-06, "loss": 1.2145, "step": 17798 }, { "epoch": 0.54, "learning_rate": 2.3285369564783848e-06, "loss": 1.0399, "step": 17799 }, { "epoch": 0.54, "learning_rate": 2.3282936116145406e-06, "loss": 1.1962, "step": 17800 }, { "epoch": 0.54, "learning_rate": 2.3280502683852596e-06, "loss": 1.1145, "step": 17801 }, { "epoch": 0.54, "learning_rate": 2.3278069267928566e-06, "loss": 1.1523, "step": 17802 }, { "epoch": 0.54, "learning_rate": 2.327563586839649e-06, "loss": 1.0355, "step": 17803 }, { "epoch": 0.54, "learning_rate": 2.327320248527953e-06, "loss": 1.2, "step": 17804 }, { "epoch": 0.54, "learning_rate": 2.3270769118600844e-06, "loss": 1.1721, "step": 17805 }, { "epoch": 0.54, "learning_rate": 2.3268335768383607e-06, "loss": 1.0687, "step": 17806 }, { "epoch": 0.54, "learning_rate": 2.326590243465098e-06, "loss": 1.0189, "step": 17807 }, { "epoch": 0.54, "learning_rate": 2.3263469117426134e-06, "loss": 1.1005, "step": 17808 }, { "epoch": 0.54, "learning_rate": 2.3261035816732216e-06, "loss": 1.0297, "step": 17809 }, { "epoch": 0.54, "learning_rate": 2.32586025325924e-06, "loss": 1.1333, "step": 17810 }, { "epoch": 0.54, "learning_rate": 2.325616926502985e-06, "loss": 1.1912, "step": 17811 }, { "epoch": 0.54, "learning_rate": 2.325373601406774e-06, "loss": 1.1102, "step": 17812 }, { "epoch": 0.54, "learning_rate": 2.325130277972921e-06, "loss": 1.1113, "step": 17813 }, { "epoch": 0.54, "learning_rate": 2.3248869562037437e-06, "loss": 1.1414, "step": 17814 }, { "epoch": 0.54, "learning_rate": 2.324643636101558e-06, "loss": 0.976, "step": 17815 }, { "epoch": 0.54, "learning_rate": 2.324400317668681e-06, "loss": 1.0696, "step": 17816 }, { "epoch": 0.54, "learning_rate": 2.324157000907428e-06, "loss": 1.1455, "step": 17817 }, { "epoch": 0.54, "learning_rate": 2.323913685820116e-06, "loss": 1.0747, "step": 17818 }, { "epoch": 0.54, "learning_rate": 2.3236703724090606e-06, "loss": 1.1501, "step": 17819 }, { "epoch": 0.54, "learning_rate": 2.323427060676578e-06, "loss": 1.0789, "step": 17820 }, { "epoch": 0.54, "learning_rate": 2.323183750624986e-06, "loss": 1.1251, "step": 17821 }, { "epoch": 0.54, "learning_rate": 2.3229404422565987e-06, "loss": 1.2043, "step": 17822 }, { "epoch": 0.54, "learning_rate": 2.3226971355737328e-06, "loss": 1.1062, "step": 17823 }, { "epoch": 0.54, "learning_rate": 2.322453830578705e-06, "loss": 1.2261, "step": 17824 }, { "epoch": 0.54, "learning_rate": 2.3222105272738324e-06, "loss": 1.0837, "step": 17825 }, { "epoch": 0.54, "learning_rate": 2.3219672256614285e-06, "loss": 1.0432, "step": 17826 }, { "epoch": 0.54, "learning_rate": 2.3217239257438114e-06, "loss": 1.1446, "step": 17827 }, { "epoch": 0.54, "learning_rate": 2.3214806275232964e-06, "loss": 1.1395, "step": 17828 }, { "epoch": 0.54, "learning_rate": 2.3212373310022e-06, "loss": 1.1439, "step": 17829 }, { "epoch": 0.54, "learning_rate": 2.3209940361828383e-06, "loss": 1.055, "step": 17830 }, { "epoch": 0.54, "learning_rate": 2.3207507430675263e-06, "loss": 1.127, "step": 17831 }, { "epoch": 0.54, "learning_rate": 2.3205074516585813e-06, "loss": 1.049, "step": 17832 }, { "epoch": 0.54, "learning_rate": 2.3202641619583203e-06, "loss": 1.0928, "step": 17833 }, { "epoch": 0.54, "learning_rate": 2.3200208739690565e-06, "loss": 1.1497, "step": 17834 }, { "epoch": 0.54, "learning_rate": 2.3197775876931075e-06, "loss": 1.1057, "step": 17835 }, { "epoch": 0.54, "learning_rate": 2.319534303132789e-06, "loss": 1.0604, "step": 17836 }, { "epoch": 0.54, "learning_rate": 2.319291020290417e-06, "loss": 1.2037, "step": 17837 }, { "epoch": 0.54, "learning_rate": 2.3190477391683086e-06, "loss": 1.0722, "step": 17838 }, { "epoch": 0.54, "learning_rate": 2.318804459768777e-06, "loss": 1.1259, "step": 17839 }, { "epoch": 0.54, "learning_rate": 2.3185611820941402e-06, "loss": 1.1669, "step": 17840 }, { "epoch": 0.54, "learning_rate": 2.3183179061467136e-06, "loss": 1.0861, "step": 17841 }, { "epoch": 0.54, "learning_rate": 2.3180746319288134e-06, "loss": 1.1639, "step": 17842 }, { "epoch": 0.54, "learning_rate": 2.3178313594427547e-06, "loss": 1.3781, "step": 17843 }, { "epoch": 0.54, "learning_rate": 2.3175880886908532e-06, "loss": 1.1547, "step": 17844 }, { "epoch": 0.54, "learning_rate": 2.3173448196754256e-06, "loss": 1.1589, "step": 17845 }, { "epoch": 0.54, "learning_rate": 2.317101552398789e-06, "loss": 1.1058, "step": 17846 }, { "epoch": 0.54, "learning_rate": 2.3168582868632556e-06, "loss": 1.0426, "step": 17847 }, { "epoch": 0.54, "learning_rate": 2.3166150230711435e-06, "loss": 1.061, "step": 17848 }, { "epoch": 0.54, "learning_rate": 2.316371761024768e-06, "loss": 1.0771, "step": 17849 }, { "epoch": 0.54, "learning_rate": 2.316128500726445e-06, "loss": 1.1023, "step": 17850 }, { "epoch": 0.54, "learning_rate": 2.3158852421784908e-06, "loss": 1.1943, "step": 17851 }, { "epoch": 0.54, "learning_rate": 2.3156419853832198e-06, "loss": 1.0563, "step": 17852 }, { "epoch": 0.54, "learning_rate": 2.315398730342948e-06, "loss": 1.0422, "step": 17853 }, { "epoch": 0.54, "learning_rate": 2.3151554770599916e-06, "loss": 1.1459, "step": 17854 }, { "epoch": 0.54, "learning_rate": 2.3149122255366664e-06, "loss": 1.1348, "step": 17855 }, { "epoch": 0.54, "learning_rate": 2.314668975775287e-06, "loss": 1.1788, "step": 17856 }, { "epoch": 0.54, "learning_rate": 2.31442572777817e-06, "loss": 1.0595, "step": 17857 }, { "epoch": 0.54, "learning_rate": 2.3141824815476306e-06, "loss": 1.0934, "step": 17858 }, { "epoch": 0.54, "learning_rate": 2.3139392370859856e-06, "loss": 1.1241, "step": 17859 }, { "epoch": 0.54, "learning_rate": 2.3136959943955483e-06, "loss": 1.1174, "step": 17860 }, { "epoch": 0.54, "learning_rate": 2.3134527534786354e-06, "loss": 1.0275, "step": 17861 }, { "epoch": 0.54, "learning_rate": 2.3132095143375627e-06, "loss": 1.1516, "step": 17862 }, { "epoch": 0.54, "learning_rate": 2.3129662769746454e-06, "loss": 1.0613, "step": 17863 }, { "epoch": 0.54, "learning_rate": 2.3127230413922e-06, "loss": 1.1399, "step": 17864 }, { "epoch": 0.54, "learning_rate": 2.3124798075925398e-06, "loss": 1.0717, "step": 17865 }, { "epoch": 0.54, "learning_rate": 2.3122365755779817e-06, "loss": 1.1523, "step": 17866 }, { "epoch": 0.54, "learning_rate": 2.311993345350841e-06, "loss": 1.0884, "step": 17867 }, { "epoch": 0.54, "learning_rate": 2.3117501169134335e-06, "loss": 1.1827, "step": 17868 }, { "epoch": 0.54, "learning_rate": 2.3115068902680737e-06, "loss": 1.1401, "step": 17869 }, { "epoch": 0.54, "learning_rate": 2.3112636654170773e-06, "loss": 1.1526, "step": 17870 }, { "epoch": 0.54, "learning_rate": 2.3110204423627607e-06, "loss": 1.1631, "step": 17871 }, { "epoch": 0.54, "learning_rate": 2.3107772211074387e-06, "loss": 1.0922, "step": 17872 }, { "epoch": 0.54, "learning_rate": 2.310534001653426e-06, "loss": 1.1733, "step": 17873 }, { "epoch": 0.54, "learning_rate": 2.3102907840030376e-06, "loss": 1.1143, "step": 17874 }, { "epoch": 0.54, "learning_rate": 2.3100475681585905e-06, "loss": 0.9677, "step": 17875 }, { "epoch": 0.54, "learning_rate": 2.3098043541223986e-06, "loss": 1.087, "step": 17876 }, { "epoch": 0.54, "learning_rate": 2.3095611418967786e-06, "loss": 1.1443, "step": 17877 }, { "epoch": 0.54, "learning_rate": 2.3093179314840437e-06, "loss": 1.108, "step": 17878 }, { "epoch": 0.54, "learning_rate": 2.3090747228865102e-06, "loss": 1.244, "step": 17879 }, { "epoch": 0.54, "learning_rate": 2.308831516106494e-06, "loss": 1.0193, "step": 17880 }, { "epoch": 0.54, "learning_rate": 2.30858831114631e-06, "loss": 1.0667, "step": 17881 }, { "epoch": 0.54, "learning_rate": 2.308345108008272e-06, "loss": 1.0972, "step": 17882 }, { "epoch": 0.54, "learning_rate": 2.3081019066946974e-06, "loss": 1.1454, "step": 17883 }, { "epoch": 0.54, "learning_rate": 2.3078587072078994e-06, "loss": 0.9938, "step": 17884 }, { "epoch": 0.54, "learning_rate": 2.3076155095501945e-06, "loss": 1.1201, "step": 17885 }, { "epoch": 0.54, "learning_rate": 2.3073723137238968e-06, "loss": 1.1588, "step": 17886 }, { "epoch": 0.54, "learning_rate": 2.307129119731322e-06, "loss": 1.0956, "step": 17887 }, { "epoch": 0.54, "learning_rate": 2.3068859275747853e-06, "loss": 1.1949, "step": 17888 }, { "epoch": 0.54, "learning_rate": 2.306642737256601e-06, "loss": 1.1558, "step": 17889 }, { "epoch": 0.54, "learning_rate": 2.306399548779086e-06, "loss": 1.0258, "step": 17890 }, { "epoch": 0.54, "learning_rate": 2.3061563621445533e-06, "loss": 1.0752, "step": 17891 }, { "epoch": 0.54, "learning_rate": 2.3059131773553185e-06, "loss": 1.1754, "step": 17892 }, { "epoch": 0.54, "learning_rate": 2.3056699944136964e-06, "loss": 1.2034, "step": 17893 }, { "epoch": 0.54, "learning_rate": 2.305426813322004e-06, "loss": 1.116, "step": 17894 }, { "epoch": 0.54, "learning_rate": 2.305183634082553e-06, "loss": 1.0852, "step": 17895 }, { "epoch": 0.54, "learning_rate": 2.3049404566976603e-06, "loss": 1.0648, "step": 17896 }, { "epoch": 0.54, "learning_rate": 2.3046972811696407e-06, "loss": 1.1026, "step": 17897 }, { "epoch": 0.54, "learning_rate": 2.3044541075008093e-06, "loss": 1.0375, "step": 17898 }, { "epoch": 0.54, "learning_rate": 2.30421093569348e-06, "loss": 1.0334, "step": 17899 }, { "epoch": 0.54, "learning_rate": 2.303967765749968e-06, "loss": 1.1661, "step": 17900 }, { "epoch": 0.54, "learning_rate": 2.303724597672589e-06, "loss": 1.0857, "step": 17901 }, { "epoch": 0.54, "learning_rate": 2.303481431463657e-06, "loss": 1.0761, "step": 17902 }, { "epoch": 0.54, "learning_rate": 2.303238267125488e-06, "loss": 1.1642, "step": 17903 }, { "epoch": 0.54, "learning_rate": 2.3029951046603954e-06, "loss": 1.1219, "step": 17904 }, { "epoch": 0.54, "learning_rate": 2.3027519440706946e-06, "loss": 1.1416, "step": 17905 }, { "epoch": 0.54, "learning_rate": 2.3025087853587e-06, "loss": 1.1442, "step": 17906 }, { "epoch": 0.54, "learning_rate": 2.3022656285267277e-06, "loss": 1.1573, "step": 17907 }, { "epoch": 0.54, "learning_rate": 2.3020224735770897e-06, "loss": 1.145, "step": 17908 }, { "epoch": 0.54, "learning_rate": 2.3017793205121035e-06, "loss": 1.1876, "step": 17909 }, { "epoch": 0.54, "learning_rate": 2.301536169334082e-06, "loss": 1.0182, "step": 17910 }, { "epoch": 0.54, "learning_rate": 2.3012930200453412e-06, "loss": 1.0781, "step": 17911 }, { "epoch": 0.54, "learning_rate": 2.3010498726481946e-06, "loss": 1.1653, "step": 17912 }, { "epoch": 0.54, "learning_rate": 2.300806727144958e-06, "loss": 1.1747, "step": 17913 }, { "epoch": 0.54, "learning_rate": 2.300563583537945e-06, "loss": 1.1688, "step": 17914 }, { "epoch": 0.54, "learning_rate": 2.3003204418294703e-06, "loss": 1.0754, "step": 17915 }, { "epoch": 0.54, "learning_rate": 2.30007730202185e-06, "loss": 1.1868, "step": 17916 }, { "epoch": 0.54, "learning_rate": 2.299834164117397e-06, "loss": 1.1396, "step": 17917 }, { "epoch": 0.54, "learning_rate": 2.299591028118426e-06, "loss": 1.0947, "step": 17918 }, { "epoch": 0.54, "learning_rate": 2.2993478940272516e-06, "loss": 1.2048, "step": 17919 }, { "epoch": 0.54, "learning_rate": 2.2991047618461897e-06, "loss": 1.1492, "step": 17920 }, { "epoch": 0.54, "learning_rate": 2.298861631577553e-06, "loss": 1.1761, "step": 17921 }, { "epoch": 0.54, "learning_rate": 2.2986185032236567e-06, "loss": 1.0856, "step": 17922 }, { "epoch": 0.54, "learning_rate": 2.298375376786815e-06, "loss": 1.1476, "step": 17923 }, { "epoch": 0.54, "learning_rate": 2.2981322522693435e-06, "loss": 1.285, "step": 17924 }, { "epoch": 0.54, "learning_rate": 2.2978891296735546e-06, "loss": 1.1172, "step": 17925 }, { "epoch": 0.54, "learning_rate": 2.2976460090017645e-06, "loss": 1.1146, "step": 17926 }, { "epoch": 0.54, "learning_rate": 2.2974028902562862e-06, "loss": 1.0789, "step": 17927 }, { "epoch": 0.54, "learning_rate": 2.297159773439436e-06, "loss": 1.0423, "step": 17928 }, { "epoch": 0.54, "learning_rate": 2.296916658553527e-06, "loss": 1.1729, "step": 17929 }, { "epoch": 0.54, "learning_rate": 2.296673545600873e-06, "loss": 1.0632, "step": 17930 }, { "epoch": 0.54, "learning_rate": 2.296430434583789e-06, "loss": 1.114, "step": 17931 }, { "epoch": 0.54, "learning_rate": 2.2961873255045888e-06, "loss": 1.0713, "step": 17932 }, { "epoch": 0.54, "learning_rate": 2.2959442183655887e-06, "loss": 1.1425, "step": 17933 }, { "epoch": 0.54, "learning_rate": 2.2957011131691e-06, "loss": 1.1416, "step": 17934 }, { "epoch": 0.54, "learning_rate": 2.2954580099174382e-06, "loss": 1.264, "step": 17935 }, { "epoch": 0.54, "learning_rate": 2.2952149086129176e-06, "loss": 1.246, "step": 17936 }, { "epoch": 0.54, "learning_rate": 2.294971809257853e-06, "loss": 1.1634, "step": 17937 }, { "epoch": 0.54, "learning_rate": 2.294728711854558e-06, "loss": 1.0889, "step": 17938 }, { "epoch": 0.54, "learning_rate": 2.2944856164053465e-06, "loss": 1.1234, "step": 17939 }, { "epoch": 0.54, "learning_rate": 2.294242522912533e-06, "loss": 1.0488, "step": 17940 }, { "epoch": 0.54, "learning_rate": 2.2939994313784316e-06, "loss": 1.0948, "step": 17941 }, { "epoch": 0.54, "learning_rate": 2.293756341805357e-06, "loss": 1.0878, "step": 17942 }, { "epoch": 0.54, "learning_rate": 2.293513254195622e-06, "loss": 1.1338, "step": 17943 }, { "epoch": 0.54, "learning_rate": 2.2932701685515416e-06, "loss": 1.1278, "step": 17944 }, { "epoch": 0.54, "learning_rate": 2.293027084875429e-06, "loss": 1.1636, "step": 17945 }, { "epoch": 0.54, "learning_rate": 2.292784003169601e-06, "loss": 1.1552, "step": 17946 }, { "epoch": 0.54, "learning_rate": 2.292540923436367e-06, "loss": 1.0325, "step": 17947 }, { "epoch": 0.54, "learning_rate": 2.292297845678045e-06, "loss": 1.1451, "step": 17948 }, { "epoch": 0.54, "learning_rate": 2.2920547698969462e-06, "loss": 1.1627, "step": 17949 }, { "epoch": 0.54, "learning_rate": 2.2918116960953872e-06, "loss": 1.0489, "step": 17950 }, { "epoch": 0.54, "learning_rate": 2.2915686242756795e-06, "loss": 1.1661, "step": 17951 }, { "epoch": 0.54, "learning_rate": 2.291325554440139e-06, "loss": 1.1182, "step": 17952 }, { "epoch": 0.54, "learning_rate": 2.2910824865910776e-06, "loss": 1.1021, "step": 17953 }, { "epoch": 0.54, "learning_rate": 2.2908394207308107e-06, "loss": 1.0729, "step": 17954 }, { "epoch": 0.54, "learning_rate": 2.290596356861653e-06, "loss": 1.1447, "step": 17955 }, { "epoch": 0.54, "learning_rate": 2.290353294985916e-06, "loss": 1.1754, "step": 17956 }, { "epoch": 0.54, "learning_rate": 2.2901102351059146e-06, "loss": 1.0977, "step": 17957 }, { "epoch": 0.54, "learning_rate": 2.289867177223963e-06, "loss": 1.1412, "step": 17958 }, { "epoch": 0.54, "learning_rate": 2.289624121342375e-06, "loss": 1.1151, "step": 17959 }, { "epoch": 0.54, "learning_rate": 2.2893810674634635e-06, "loss": 1.0294, "step": 17960 }, { "epoch": 0.54, "learning_rate": 2.289138015589543e-06, "loss": 1.1173, "step": 17961 }, { "epoch": 0.54, "learning_rate": 2.2888949657229266e-06, "loss": 1.1387, "step": 17962 }, { "epoch": 0.54, "learning_rate": 2.2886519178659296e-06, "loss": 1.0193, "step": 17963 }, { "epoch": 0.54, "learning_rate": 2.2884088720208637e-06, "loss": 1.1984, "step": 17964 }, { "epoch": 0.54, "learning_rate": 2.2881658281900434e-06, "loss": 1.0898, "step": 17965 }, { "epoch": 0.54, "learning_rate": 2.2879227863757824e-06, "loss": 1.0623, "step": 17966 }, { "epoch": 0.54, "learning_rate": 2.2876797465803943e-06, "loss": 1.1184, "step": 17967 }, { "epoch": 0.54, "learning_rate": 2.2874367088061933e-06, "loss": 1.2573, "step": 17968 }, { "epoch": 0.54, "learning_rate": 2.287193673055492e-06, "loss": 1.1638, "step": 17969 }, { "epoch": 0.54, "learning_rate": 2.2869506393306042e-06, "loss": 1.096, "step": 17970 }, { "epoch": 0.54, "learning_rate": 2.286707607633844e-06, "loss": 1.0582, "step": 17971 }, { "epoch": 0.54, "learning_rate": 2.2864645779675253e-06, "loss": 1.1683, "step": 17972 }, { "epoch": 0.54, "learning_rate": 2.2862215503339604e-06, "loss": 1.06, "step": 17973 }, { "epoch": 0.54, "learning_rate": 2.285978524735463e-06, "loss": 1.1022, "step": 17974 }, { "epoch": 0.54, "learning_rate": 2.2857355011743472e-06, "loss": 1.1902, "step": 17975 }, { "epoch": 0.54, "learning_rate": 2.2854924796529264e-06, "loss": 1.0507, "step": 17976 }, { "epoch": 0.54, "learning_rate": 2.2852494601735143e-06, "loss": 1.0672, "step": 17977 }, { "epoch": 0.54, "learning_rate": 2.2850064427384234e-06, "loss": 1.1664, "step": 17978 }, { "epoch": 0.54, "learning_rate": 2.284763427349967e-06, "loss": 1.11, "step": 17979 }, { "epoch": 0.54, "learning_rate": 2.28452041401046e-06, "loss": 1.1002, "step": 17980 }, { "epoch": 0.54, "learning_rate": 2.284277402722215e-06, "loss": 1.0376, "step": 17981 }, { "epoch": 0.54, "learning_rate": 2.2840343934875443e-06, "loss": 1.1178, "step": 17982 }, { "epoch": 0.54, "learning_rate": 2.2837913863087625e-06, "loss": 1.0887, "step": 17983 }, { "epoch": 0.54, "learning_rate": 2.2835483811881826e-06, "loss": 1.1103, "step": 17984 }, { "epoch": 0.54, "learning_rate": 2.2833053781281193e-06, "loss": 1.0372, "step": 17985 }, { "epoch": 0.54, "learning_rate": 2.283062377130883e-06, "loss": 1.1641, "step": 17986 }, { "epoch": 0.54, "learning_rate": 2.2828193781987882e-06, "loss": 1.2638, "step": 17987 }, { "epoch": 0.54, "learning_rate": 2.2825763813341487e-06, "loss": 1.1404, "step": 17988 }, { "epoch": 0.54, "learning_rate": 2.2823333865392783e-06, "loss": 1.0997, "step": 17989 }, { "epoch": 0.54, "learning_rate": 2.282090393816488e-06, "loss": 0.9881, "step": 17990 }, { "epoch": 0.54, "learning_rate": 2.281847403168092e-06, "loss": 1.0866, "step": 17991 }, { "epoch": 0.54, "learning_rate": 2.2816044145964044e-06, "loss": 1.0726, "step": 17992 }, { "epoch": 0.54, "learning_rate": 2.2813614281037367e-06, "loss": 1.1799, "step": 17993 }, { "epoch": 0.54, "learning_rate": 2.2811184436924043e-06, "loss": 1.1099, "step": 17994 }, { "epoch": 0.54, "learning_rate": 2.280875461364718e-06, "loss": 1.1019, "step": 17995 }, { "epoch": 0.54, "learning_rate": 2.280632481122991e-06, "loss": 1.1669, "step": 17996 }, { "epoch": 0.54, "learning_rate": 2.2803895029695385e-06, "loss": 1.0225, "step": 17997 }, { "epoch": 0.54, "learning_rate": 2.280146526906672e-06, "loss": 1.0673, "step": 17998 }, { "epoch": 0.54, "learning_rate": 2.2799035529367047e-06, "loss": 1.1801, "step": 17999 }, { "epoch": 0.54, "learning_rate": 2.2796605810619486e-06, "loss": 1.213, "step": 18000 }, { "epoch": 0.54, "learning_rate": 2.2794176112847185e-06, "loss": 1.1671, "step": 18001 }, { "epoch": 0.54, "learning_rate": 2.279174643607327e-06, "loss": 1.2006, "step": 18002 }, { "epoch": 0.54, "learning_rate": 2.2789316780320854e-06, "loss": 1.1066, "step": 18003 }, { "epoch": 0.54, "learning_rate": 2.2786887145613082e-06, "loss": 1.1656, "step": 18004 }, { "epoch": 0.54, "learning_rate": 2.2784457531973073e-06, "loss": 1.1382, "step": 18005 }, { "epoch": 0.54, "learning_rate": 2.278202793942397e-06, "loss": 1.2499, "step": 18006 }, { "epoch": 0.54, "learning_rate": 2.2779598367988893e-06, "loss": 1.0899, "step": 18007 }, { "epoch": 0.54, "learning_rate": 2.2777168817690966e-06, "loss": 1.1957, "step": 18008 }, { "epoch": 0.54, "learning_rate": 2.2774739288553314e-06, "loss": 1.1103, "step": 18009 }, { "epoch": 0.54, "learning_rate": 2.277230978059908e-06, "loss": 1.0168, "step": 18010 }, { "epoch": 0.54, "learning_rate": 2.276988029385139e-06, "loss": 1.1492, "step": 18011 }, { "epoch": 0.54, "learning_rate": 2.2767450828333364e-06, "loss": 1.0789, "step": 18012 }, { "epoch": 0.54, "learning_rate": 2.276502138406812e-06, "loss": 1.105, "step": 18013 }, { "epoch": 0.54, "learning_rate": 2.27625919610788e-06, "loss": 1.113, "step": 18014 }, { "epoch": 0.54, "learning_rate": 2.2760162559388544e-06, "loss": 1.1089, "step": 18015 }, { "epoch": 0.54, "learning_rate": 2.2757733179020443e-06, "loss": 1.0838, "step": 18016 }, { "epoch": 0.54, "learning_rate": 2.2755303819997645e-06, "loss": 1.1396, "step": 18017 }, { "epoch": 0.54, "learning_rate": 2.2752874482343273e-06, "loss": 1.1951, "step": 18018 }, { "epoch": 0.54, "learning_rate": 2.275044516608046e-06, "loss": 0.9342, "step": 18019 }, { "epoch": 0.54, "learning_rate": 2.2748015871232316e-06, "loss": 1.1271, "step": 18020 }, { "epoch": 0.54, "learning_rate": 2.274558659782198e-06, "loss": 1.1769, "step": 18021 }, { "epoch": 0.54, "learning_rate": 2.2743157345872573e-06, "loss": 1.1077, "step": 18022 }, { "epoch": 0.54, "learning_rate": 2.2740728115407222e-06, "loss": 1.1451, "step": 18023 }, { "epoch": 0.54, "learning_rate": 2.2738298906449063e-06, "loss": 1.1132, "step": 18024 }, { "epoch": 0.54, "learning_rate": 2.2735869719021197e-06, "loss": 1.1983, "step": 18025 }, { "epoch": 0.54, "learning_rate": 2.2733440553146763e-06, "loss": 1.0949, "step": 18026 }, { "epoch": 0.54, "learning_rate": 2.273101140884888e-06, "loss": 0.9958, "step": 18027 }, { "epoch": 0.54, "learning_rate": 2.2728582286150687e-06, "loss": 1.0139, "step": 18028 }, { "epoch": 0.54, "learning_rate": 2.2726153185075285e-06, "loss": 1.1438, "step": 18029 }, { "epoch": 0.54, "learning_rate": 2.2723724105645815e-06, "loss": 1.2711, "step": 18030 }, { "epoch": 0.54, "learning_rate": 2.272129504788539e-06, "loss": 1.0338, "step": 18031 }, { "epoch": 0.54, "learning_rate": 2.2718866011817146e-06, "loss": 1.0909, "step": 18032 }, { "epoch": 0.54, "learning_rate": 2.271643699746419e-06, "loss": 1.1151, "step": 18033 }, { "epoch": 0.54, "learning_rate": 2.2714008004849657e-06, "loss": 1.2095, "step": 18034 }, { "epoch": 0.54, "learning_rate": 2.271157903399667e-06, "loss": 1.0557, "step": 18035 }, { "epoch": 0.54, "learning_rate": 2.2709150084928342e-06, "loss": 1.105, "step": 18036 }, { "epoch": 0.54, "learning_rate": 2.2706721157667815e-06, "loss": 1.3624, "step": 18037 }, { "epoch": 0.54, "learning_rate": 2.270429225223819e-06, "loss": 1.1249, "step": 18038 }, { "epoch": 0.54, "learning_rate": 2.2701863368662596e-06, "loss": 1.033, "step": 18039 }, { "epoch": 0.54, "learning_rate": 2.2699434506964156e-06, "loss": 0.9906, "step": 18040 }, { "epoch": 0.54, "learning_rate": 2.2697005667166e-06, "loss": 1.1824, "step": 18041 }, { "epoch": 0.54, "learning_rate": 2.269457684929123e-06, "loss": 1.1722, "step": 18042 }, { "epoch": 0.54, "learning_rate": 2.269214805336298e-06, "loss": 1.1271, "step": 18043 }, { "epoch": 0.54, "learning_rate": 2.268971927940437e-06, "loss": 1.1633, "step": 18044 }, { "epoch": 0.54, "learning_rate": 2.2687290527438524e-06, "loss": 1.0611, "step": 18045 }, { "epoch": 0.54, "learning_rate": 2.2684861797488554e-06, "loss": 1.022, "step": 18046 }, { "epoch": 0.54, "learning_rate": 2.268243308957758e-06, "loss": 1.2524, "step": 18047 }, { "epoch": 0.54, "learning_rate": 2.2680004403728737e-06, "loss": 1.0893, "step": 18048 }, { "epoch": 0.54, "learning_rate": 2.2677575739965125e-06, "loss": 1.1204, "step": 18049 }, { "epoch": 0.54, "learning_rate": 2.2675147098309886e-06, "loss": 1.1778, "step": 18050 }, { "epoch": 0.54, "learning_rate": 2.2672718478786115e-06, "loss": 1.2583, "step": 18051 }, { "epoch": 0.54, "learning_rate": 2.2670289881416944e-06, "loss": 1.1497, "step": 18052 }, { "epoch": 0.54, "learning_rate": 2.2667861306225492e-06, "loss": 1.2189, "step": 18053 }, { "epoch": 0.54, "learning_rate": 2.2665432753234893e-06, "loss": 1.1579, "step": 18054 }, { "epoch": 0.54, "learning_rate": 2.2663004222468236e-06, "loss": 1.1885, "step": 18055 }, { "epoch": 0.54, "learning_rate": 2.2660575713948653e-06, "loss": 1.2435, "step": 18056 }, { "epoch": 0.54, "learning_rate": 2.265814722769926e-06, "loss": 1.0852, "step": 18057 }, { "epoch": 0.54, "learning_rate": 2.2655718763743183e-06, "loss": 1.2139, "step": 18058 }, { "epoch": 0.54, "learning_rate": 2.2653290322103534e-06, "loss": 1.0938, "step": 18059 }, { "epoch": 0.54, "learning_rate": 2.2650861902803427e-06, "loss": 1.093, "step": 18060 }, { "epoch": 0.54, "learning_rate": 2.2648433505865985e-06, "loss": 1.0687, "step": 18061 }, { "epoch": 0.54, "learning_rate": 2.2646005131314324e-06, "loss": 1.179, "step": 18062 }, { "epoch": 0.54, "learning_rate": 2.2643576779171562e-06, "loss": 1.0114, "step": 18063 }, { "epoch": 0.54, "learning_rate": 2.2641148449460813e-06, "loss": 1.1006, "step": 18064 }, { "epoch": 0.54, "learning_rate": 2.263872014220519e-06, "loss": 1.0641, "step": 18065 }, { "epoch": 0.54, "learning_rate": 2.2636291857427815e-06, "loss": 1.0594, "step": 18066 }, { "epoch": 0.54, "learning_rate": 2.2633863595151815e-06, "loss": 1.0418, "step": 18067 }, { "epoch": 0.54, "learning_rate": 2.263143535540029e-06, "loss": 1.1778, "step": 18068 }, { "epoch": 0.54, "learning_rate": 2.262900713819635e-06, "loss": 1.1264, "step": 18069 }, { "epoch": 0.54, "learning_rate": 2.2626578943563123e-06, "loss": 1.1305, "step": 18070 }, { "epoch": 0.54, "learning_rate": 2.2624150771523733e-06, "loss": 1.0362, "step": 18071 }, { "epoch": 0.54, "learning_rate": 2.2621722622101274e-06, "loss": 1.1409, "step": 18072 }, { "epoch": 0.54, "learning_rate": 2.2619294495318866e-06, "loss": 1.0719, "step": 18073 }, { "epoch": 0.54, "learning_rate": 2.2616866391199634e-06, "loss": 1.0665, "step": 18074 }, { "epoch": 0.54, "learning_rate": 2.261443830976668e-06, "loss": 1.2274, "step": 18075 }, { "epoch": 0.54, "learning_rate": 2.2612010251043132e-06, "loss": 1.0765, "step": 18076 }, { "epoch": 0.54, "learning_rate": 2.260958221505209e-06, "loss": 1.1395, "step": 18077 }, { "epoch": 0.54, "learning_rate": 2.2607154201816676e-06, "loss": 1.0714, "step": 18078 }, { "epoch": 0.54, "learning_rate": 2.260472621136e-06, "loss": 1.149, "step": 18079 }, { "epoch": 0.54, "learning_rate": 2.260229824370519e-06, "loss": 1.1862, "step": 18080 }, { "epoch": 0.54, "learning_rate": 2.2599870298875332e-06, "loss": 1.1392, "step": 18081 }, { "epoch": 0.54, "learning_rate": 2.2597442376893556e-06, "loss": 1.2115, "step": 18082 }, { "epoch": 0.54, "learning_rate": 2.2595014477782966e-06, "loss": 1.0696, "step": 18083 }, { "epoch": 0.54, "learning_rate": 2.2592586601566694e-06, "loss": 1.0773, "step": 18084 }, { "epoch": 0.54, "learning_rate": 2.259015874826783e-06, "loss": 1.1665, "step": 18085 }, { "epoch": 0.54, "learning_rate": 2.2587730917909494e-06, "loss": 1.0889, "step": 18086 }, { "epoch": 0.54, "learning_rate": 2.2585303110514793e-06, "loss": 1.3147, "step": 18087 }, { "epoch": 0.54, "learning_rate": 2.2582875326106846e-06, "loss": 1.2256, "step": 18088 }, { "epoch": 0.54, "learning_rate": 2.258044756470877e-06, "loss": 1.1449, "step": 18089 }, { "epoch": 0.54, "learning_rate": 2.257801982634366e-06, "loss": 1.1347, "step": 18090 }, { "epoch": 0.54, "learning_rate": 2.257559211103463e-06, "loss": 1.0779, "step": 18091 }, { "epoch": 0.55, "learning_rate": 2.2573164418804804e-06, "loss": 1.0465, "step": 18092 }, { "epoch": 0.55, "learning_rate": 2.257073674967729e-06, "loss": 1.136, "step": 18093 }, { "epoch": 0.55, "learning_rate": 2.256830910367518e-06, "loss": 1.0714, "step": 18094 }, { "epoch": 0.55, "learning_rate": 2.25658814808216e-06, "loss": 1.167, "step": 18095 }, { "epoch": 0.55, "learning_rate": 2.2563453881139655e-06, "loss": 1.0149, "step": 18096 }, { "epoch": 0.55, "learning_rate": 2.2561026304652467e-06, "loss": 1.2555, "step": 18097 }, { "epoch": 0.55, "learning_rate": 2.255859875138312e-06, "loss": 1.1705, "step": 18098 }, { "epoch": 0.55, "learning_rate": 2.2556171221354737e-06, "loss": 1.1713, "step": 18099 }, { "epoch": 0.55, "learning_rate": 2.255374371459043e-06, "loss": 1.1959, "step": 18100 }, { "epoch": 0.55, "learning_rate": 2.2551316231113305e-06, "loss": 1.1097, "step": 18101 }, { "epoch": 0.55, "learning_rate": 2.2548888770946475e-06, "loss": 1.0309, "step": 18102 }, { "epoch": 0.55, "learning_rate": 2.254646133411304e-06, "loss": 1.0237, "step": 18103 }, { "epoch": 0.55, "learning_rate": 2.2544033920636105e-06, "loss": 1.177, "step": 18104 }, { "epoch": 0.55, "learning_rate": 2.2541606530538788e-06, "loss": 1.158, "step": 18105 }, { "epoch": 0.55, "learning_rate": 2.2539179163844203e-06, "loss": 1.2885, "step": 18106 }, { "epoch": 0.55, "learning_rate": 2.2536751820575437e-06, "loss": 1.2416, "step": 18107 }, { "epoch": 0.55, "learning_rate": 2.253432450075561e-06, "loss": 1.103, "step": 18108 }, { "epoch": 0.55, "learning_rate": 2.2531897204407822e-06, "loss": 1.1451, "step": 18109 }, { "epoch": 0.55, "learning_rate": 2.2529469931555197e-06, "loss": 1.1119, "step": 18110 }, { "epoch": 0.55, "learning_rate": 2.2527042682220813e-06, "loss": 1.0897, "step": 18111 }, { "epoch": 0.55, "learning_rate": 2.2524615456427796e-06, "loss": 1.1478, "step": 18112 }, { "epoch": 0.55, "learning_rate": 2.252218825419925e-06, "loss": 0.9619, "step": 18113 }, { "epoch": 0.55, "learning_rate": 2.2519761075558273e-06, "loss": 1.1378, "step": 18114 }, { "epoch": 0.55, "learning_rate": 2.2517333920527985e-06, "loss": 1.0628, "step": 18115 }, { "epoch": 0.55, "learning_rate": 2.251490678913148e-06, "loss": 1.2644, "step": 18116 }, { "epoch": 0.55, "learning_rate": 2.251247968139186e-06, "loss": 1.1713, "step": 18117 }, { "epoch": 0.55, "learning_rate": 2.2510052597332237e-06, "loss": 1.1979, "step": 18118 }, { "epoch": 0.55, "learning_rate": 2.250762553697572e-06, "loss": 1.0833, "step": 18119 }, { "epoch": 0.55, "learning_rate": 2.2505198500345404e-06, "loss": 1.1165, "step": 18120 }, { "epoch": 0.55, "learning_rate": 2.2502771487464393e-06, "loss": 1.1527, "step": 18121 }, { "epoch": 0.55, "learning_rate": 2.2500344498355798e-06, "loss": 1.1602, "step": 18122 }, { "epoch": 0.55, "learning_rate": 2.2497917533042725e-06, "loss": 1.2247, "step": 18123 }, { "epoch": 0.55, "learning_rate": 2.2495490591548266e-06, "loss": 1.1793, "step": 18124 }, { "epoch": 0.55, "learning_rate": 2.249306367389553e-06, "loss": 1.0504, "step": 18125 }, { "epoch": 0.55, "learning_rate": 2.249063678010762e-06, "loss": 1.0657, "step": 18126 }, { "epoch": 0.55, "learning_rate": 2.2488209910207637e-06, "loss": 1.1174, "step": 18127 }, { "epoch": 0.55, "learning_rate": 2.2485783064218692e-06, "loss": 1.1944, "step": 18128 }, { "epoch": 0.55, "learning_rate": 2.248335624216388e-06, "loss": 1.1447, "step": 18129 }, { "epoch": 0.55, "learning_rate": 2.2480929444066304e-06, "loss": 1.1688, "step": 18130 }, { "epoch": 0.55, "learning_rate": 2.2478502669949066e-06, "loss": 1.2103, "step": 18131 }, { "epoch": 0.55, "learning_rate": 2.247607591983527e-06, "loss": 1.0257, "step": 18132 }, { "epoch": 0.55, "learning_rate": 2.2473649193748013e-06, "loss": 1.0659, "step": 18133 }, { "epoch": 0.55, "learning_rate": 2.2471222491710394e-06, "loss": 1.075, "step": 18134 }, { "epoch": 0.55, "learning_rate": 2.2468795813745524e-06, "loss": 1.1161, "step": 18135 }, { "epoch": 0.55, "learning_rate": 2.246636915987651e-06, "loss": 1.2588, "step": 18136 }, { "epoch": 0.55, "learning_rate": 2.246394253012643e-06, "loss": 1.224, "step": 18137 }, { "epoch": 0.55, "learning_rate": 2.246151592451839e-06, "loss": 1.1235, "step": 18138 }, { "epoch": 0.55, "learning_rate": 2.24590893430755e-06, "loss": 1.1529, "step": 18139 }, { "epoch": 0.55, "learning_rate": 2.245666278582086e-06, "loss": 1.1209, "step": 18140 }, { "epoch": 0.55, "learning_rate": 2.245423625277757e-06, "loss": 1.1331, "step": 18141 }, { "epoch": 0.55, "learning_rate": 2.2451809743968717e-06, "loss": 1.1258, "step": 18142 }, { "epoch": 0.55, "learning_rate": 2.244938325941741e-06, "loss": 1.177, "step": 18143 }, { "epoch": 0.55, "learning_rate": 2.244695679914674e-06, "loss": 1.0956, "step": 18144 }, { "epoch": 0.55, "learning_rate": 2.244453036317982e-06, "loss": 1.0844, "step": 18145 }, { "epoch": 0.55, "learning_rate": 2.2442103951539734e-06, "loss": 1.0637, "step": 18146 }, { "epoch": 0.55, "learning_rate": 2.243967756424959e-06, "loss": 1.1022, "step": 18147 }, { "epoch": 0.55, "learning_rate": 2.243725120133248e-06, "loss": 1.1523, "step": 18148 }, { "epoch": 0.55, "learning_rate": 2.2434824862811514e-06, "loss": 1.1696, "step": 18149 }, { "epoch": 0.55, "learning_rate": 2.2432398548709768e-06, "loss": 1.3004, "step": 18150 }, { "epoch": 0.55, "learning_rate": 2.2429972259050356e-06, "loss": 1.2695, "step": 18151 }, { "epoch": 0.55, "learning_rate": 2.242754599385637e-06, "loss": 1.142, "step": 18152 }, { "epoch": 0.55, "learning_rate": 2.24251197531509e-06, "loss": 1.1802, "step": 18153 }, { "epoch": 0.55, "learning_rate": 2.242269353695707e-06, "loss": 1.214, "step": 18154 }, { "epoch": 0.55, "learning_rate": 2.2420267345297938e-06, "loss": 1.1429, "step": 18155 }, { "epoch": 0.55, "learning_rate": 2.241784117819662e-06, "loss": 1.1921, "step": 18156 }, { "epoch": 0.55, "learning_rate": 2.2415415035676213e-06, "loss": 1.0579, "step": 18157 }, { "epoch": 0.55, "learning_rate": 2.2412988917759816e-06, "loss": 1.1044, "step": 18158 }, { "epoch": 0.55, "learning_rate": 2.241056282447051e-06, "loss": 1.1172, "step": 18159 }, { "epoch": 0.55, "learning_rate": 2.24081367558314e-06, "loss": 1.1254, "step": 18160 }, { "epoch": 0.55, "learning_rate": 2.240571071186558e-06, "loss": 1.1398, "step": 18161 }, { "epoch": 0.55, "learning_rate": 2.2403284692596154e-06, "loss": 1.3174, "step": 18162 }, { "epoch": 0.55, "learning_rate": 2.2400858698046197e-06, "loss": 1.0944, "step": 18163 }, { "epoch": 0.55, "learning_rate": 2.239843272823882e-06, "loss": 1.0549, "step": 18164 }, { "epoch": 0.55, "learning_rate": 2.23960067831971e-06, "loss": 1.1512, "step": 18165 }, { "epoch": 0.55, "learning_rate": 2.2393580862944146e-06, "loss": 1.2327, "step": 18166 }, { "epoch": 0.55, "learning_rate": 2.2391154967503058e-06, "loss": 1.1483, "step": 18167 }, { "epoch": 0.55, "learning_rate": 2.238872909689691e-06, "loss": 1.0481, "step": 18168 }, { "epoch": 0.55, "learning_rate": 2.2386303251148795e-06, "loss": 1.1304, "step": 18169 }, { "epoch": 0.55, "learning_rate": 2.238387743028182e-06, "loss": 1.1703, "step": 18170 }, { "epoch": 0.55, "learning_rate": 2.238145163431908e-06, "loss": 1.1714, "step": 18171 }, { "epoch": 0.55, "learning_rate": 2.237902586328365e-06, "loss": 1.0381, "step": 18172 }, { "epoch": 0.55, "learning_rate": 2.2376600117198633e-06, "loss": 1.1143, "step": 18173 }, { "epoch": 0.55, "learning_rate": 2.2374174396087116e-06, "loss": 1.0318, "step": 18174 }, { "epoch": 0.55, "learning_rate": 2.237174869997221e-06, "loss": 1.1017, "step": 18175 }, { "epoch": 0.55, "learning_rate": 2.2369323028876975e-06, "loss": 1.0161, "step": 18176 }, { "epoch": 0.55, "learning_rate": 2.236689738282452e-06, "loss": 1.0616, "step": 18177 }, { "epoch": 0.55, "learning_rate": 2.2364471761837938e-06, "loss": 1.0883, "step": 18178 }, { "epoch": 0.55, "learning_rate": 2.236204616594031e-06, "loss": 1.0753, "step": 18179 }, { "epoch": 0.55, "learning_rate": 2.235962059515474e-06, "loss": 1.1227, "step": 18180 }, { "epoch": 0.55, "learning_rate": 2.2357195049504307e-06, "loss": 1.0605, "step": 18181 }, { "epoch": 0.55, "learning_rate": 2.2354769529012103e-06, "loss": 1.1638, "step": 18182 }, { "epoch": 0.55, "learning_rate": 2.2352344033701214e-06, "loss": 1.1682, "step": 18183 }, { "epoch": 0.55, "learning_rate": 2.2349918563594743e-06, "loss": 1.1962, "step": 18184 }, { "epoch": 0.55, "learning_rate": 2.2347493118715764e-06, "loss": 1.1326, "step": 18185 }, { "epoch": 0.55, "learning_rate": 2.234506769908738e-06, "loss": 1.1771, "step": 18186 }, { "epoch": 0.55, "learning_rate": 2.2342642304732665e-06, "loss": 1.2105, "step": 18187 }, { "epoch": 0.55, "learning_rate": 2.234021693567473e-06, "loss": 1.159, "step": 18188 }, { "epoch": 0.55, "learning_rate": 2.2337791591936635e-06, "loss": 1.0989, "step": 18189 }, { "epoch": 0.55, "learning_rate": 2.2335366273541486e-06, "loss": 1.1007, "step": 18190 }, { "epoch": 0.55, "learning_rate": 2.2332940980512364e-06, "loss": 1.0942, "step": 18191 }, { "epoch": 0.55, "learning_rate": 2.2330515712872357e-06, "loss": 1.2333, "step": 18192 }, { "epoch": 0.55, "learning_rate": 2.232809047064457e-06, "loss": 1.1214, "step": 18193 }, { "epoch": 0.55, "learning_rate": 2.2325665253852065e-06, "loss": 1.0551, "step": 18194 }, { "epoch": 0.55, "learning_rate": 2.2323240062517935e-06, "loss": 1.124, "step": 18195 }, { "epoch": 0.55, "learning_rate": 2.232081489666527e-06, "loss": 1.147, "step": 18196 }, { "epoch": 0.55, "learning_rate": 2.2318389756317163e-06, "loss": 1.0103, "step": 18197 }, { "epoch": 0.55, "learning_rate": 2.231596464149669e-06, "loss": 1.05, "step": 18198 }, { "epoch": 0.55, "learning_rate": 2.231353955222694e-06, "loss": 1.1548, "step": 18199 }, { "epoch": 0.55, "learning_rate": 2.2311114488531e-06, "loss": 1.1702, "step": 18200 }, { "epoch": 0.55, "learning_rate": 2.2308689450431966e-06, "loss": 1.207, "step": 18201 }, { "epoch": 0.55, "learning_rate": 2.23062644379529e-06, "loss": 1.0757, "step": 18202 }, { "epoch": 0.55, "learning_rate": 2.2303839451116906e-06, "loss": 1.0292, "step": 18203 }, { "epoch": 0.55, "learning_rate": 2.2301414489947056e-06, "loss": 1.0344, "step": 18204 }, { "epoch": 0.55, "learning_rate": 2.229898955446645e-06, "loss": 1.1364, "step": 18205 }, { "epoch": 0.55, "learning_rate": 2.2296564644698154e-06, "loss": 1.164, "step": 18206 }, { "epoch": 0.55, "learning_rate": 2.229413976066526e-06, "loss": 1.1914, "step": 18207 }, { "epoch": 0.55, "learning_rate": 2.229171490239085e-06, "loss": 1.1476, "step": 18208 }, { "epoch": 0.55, "learning_rate": 2.228929006989801e-06, "loss": 1.1157, "step": 18209 }, { "epoch": 0.55, "learning_rate": 2.2286865263209835e-06, "loss": 1.2153, "step": 18210 }, { "epoch": 0.55, "learning_rate": 2.2284440482349384e-06, "loss": 1.162, "step": 18211 }, { "epoch": 0.55, "learning_rate": 2.2282015727339755e-06, "loss": 1.129, "step": 18212 }, { "epoch": 0.55, "learning_rate": 2.227959099820403e-06, "loss": 1.1063, "step": 18213 }, { "epoch": 0.55, "learning_rate": 2.227716629496529e-06, "loss": 1.1014, "step": 18214 }, { "epoch": 0.55, "learning_rate": 2.227474161764661e-06, "loss": 1.1428, "step": 18215 }, { "epoch": 0.55, "learning_rate": 2.227231696627108e-06, "loss": 0.9728, "step": 18216 }, { "epoch": 0.55, "learning_rate": 2.2269892340861773e-06, "loss": 1.1572, "step": 18217 }, { "epoch": 0.55, "learning_rate": 2.2267467741441793e-06, "loss": 1.1149, "step": 18218 }, { "epoch": 0.55, "learning_rate": 2.226504316803419e-06, "loss": 1.0927, "step": 18219 }, { "epoch": 0.55, "learning_rate": 2.226261862066206e-06, "loss": 1.1023, "step": 18220 }, { "epoch": 0.55, "learning_rate": 2.2260194099348478e-06, "loss": 1.16, "step": 18221 }, { "epoch": 0.55, "learning_rate": 2.225776960411653e-06, "loss": 1.0045, "step": 18222 }, { "epoch": 0.55, "learning_rate": 2.2255345134989306e-06, "loss": 1.1438, "step": 18223 }, { "epoch": 0.55, "learning_rate": 2.225292069198987e-06, "loss": 1.0531, "step": 18224 }, { "epoch": 0.55, "learning_rate": 2.22504962751413e-06, "loss": 1.2114, "step": 18225 }, { "epoch": 0.55, "learning_rate": 2.224807188446668e-06, "loss": 1.1076, "step": 18226 }, { "epoch": 0.55, "learning_rate": 2.22456475199891e-06, "loss": 1.071, "step": 18227 }, { "epoch": 0.55, "learning_rate": 2.2243223181731622e-06, "loss": 1.1083, "step": 18228 }, { "epoch": 0.55, "learning_rate": 2.2240798869717332e-06, "loss": 1.2521, "step": 18229 }, { "epoch": 0.55, "learning_rate": 2.2238374583969306e-06, "loss": 1.1646, "step": 18230 }, { "epoch": 0.55, "learning_rate": 2.2235950324510636e-06, "loss": 1.0702, "step": 18231 }, { "epoch": 0.55, "learning_rate": 2.223352609136438e-06, "loss": 1.1398, "step": 18232 }, { "epoch": 0.55, "learning_rate": 2.223110188455362e-06, "loss": 0.9959, "step": 18233 }, { "epoch": 0.55, "learning_rate": 2.2228677704101436e-06, "loss": 0.9294, "step": 18234 }, { "epoch": 0.55, "learning_rate": 2.2226253550030903e-06, "loss": 1.1379, "step": 18235 }, { "epoch": 0.55, "learning_rate": 2.2223829422365118e-06, "loss": 1.104, "step": 18236 }, { "epoch": 0.55, "learning_rate": 2.2221405321127125e-06, "loss": 1.1053, "step": 18237 }, { "epoch": 0.55, "learning_rate": 2.2218981246340014e-06, "loss": 1.1263, "step": 18238 }, { "epoch": 0.55, "learning_rate": 2.2216557198026864e-06, "loss": 1.097, "step": 18239 }, { "epoch": 0.55, "learning_rate": 2.2214133176210754e-06, "loss": 1.0999, "step": 18240 }, { "epoch": 0.55, "learning_rate": 2.221170918091475e-06, "loss": 1.1637, "step": 18241 }, { "epoch": 0.55, "learning_rate": 2.220928521216193e-06, "loss": 1.222, "step": 18242 }, { "epoch": 0.55, "learning_rate": 2.220686126997537e-06, "loss": 1.098, "step": 18243 }, { "epoch": 0.55, "learning_rate": 2.220443735437816e-06, "loss": 1.194, "step": 18244 }, { "epoch": 0.55, "learning_rate": 2.2202013465393346e-06, "loss": 1.1191, "step": 18245 }, { "epoch": 0.55, "learning_rate": 2.2199589603044017e-06, "loss": 1.066, "step": 18246 }, { "epoch": 0.55, "learning_rate": 2.2197165767353246e-06, "loss": 1.1578, "step": 18247 }, { "epoch": 0.55, "learning_rate": 2.2194741958344107e-06, "loss": 1.1705, "step": 18248 }, { "epoch": 0.55, "learning_rate": 2.2192318176039683e-06, "loss": 1.1783, "step": 18249 }, { "epoch": 0.55, "learning_rate": 2.2189894420463034e-06, "loss": 1.1198, "step": 18250 }, { "epoch": 0.55, "learning_rate": 2.218747069163723e-06, "loss": 1.1694, "step": 18251 }, { "epoch": 0.55, "learning_rate": 2.218504698958535e-06, "loss": 1.0232, "step": 18252 }, { "epoch": 0.55, "learning_rate": 2.2182623314330476e-06, "loss": 1.1432, "step": 18253 }, { "epoch": 0.55, "learning_rate": 2.2180199665895663e-06, "loss": 1.2308, "step": 18254 }, { "epoch": 0.55, "learning_rate": 2.2177776044303993e-06, "loss": 1.1415, "step": 18255 }, { "epoch": 0.55, "learning_rate": 2.217535244957853e-06, "loss": 1.1255, "step": 18256 }, { "epoch": 0.55, "learning_rate": 2.217292888174237e-06, "loss": 1.085, "step": 18257 }, { "epoch": 0.55, "learning_rate": 2.217050534081855e-06, "loss": 1.1688, "step": 18258 }, { "epoch": 0.55, "learning_rate": 2.216808182683016e-06, "loss": 1.1497, "step": 18259 }, { "epoch": 0.55, "learning_rate": 2.2165658339800266e-06, "loss": 1.019, "step": 18260 }, { "epoch": 0.55, "learning_rate": 2.2163234879751937e-06, "loss": 1.1619, "step": 18261 }, { "epoch": 0.55, "learning_rate": 2.216081144670826e-06, "loss": 1.1232, "step": 18262 }, { "epoch": 0.55, "learning_rate": 2.2158388040692278e-06, "loss": 1.0987, "step": 18263 }, { "epoch": 0.55, "learning_rate": 2.215596466172707e-06, "loss": 1.058, "step": 18264 }, { "epoch": 0.55, "learning_rate": 2.2153541309835715e-06, "loss": 1.0863, "step": 18265 }, { "epoch": 0.55, "learning_rate": 2.2151117985041278e-06, "loss": 1.2466, "step": 18266 }, { "epoch": 0.55, "learning_rate": 2.214869468736682e-06, "loss": 1.0848, "step": 18267 }, { "epoch": 0.55, "learning_rate": 2.2146271416835416e-06, "loss": 1.1898, "step": 18268 }, { "epoch": 0.55, "learning_rate": 2.2143848173470135e-06, "loss": 1.0918, "step": 18269 }, { "epoch": 0.55, "learning_rate": 2.2141424957294053e-06, "loss": 1.0848, "step": 18270 }, { "epoch": 0.55, "learning_rate": 2.2139001768330216e-06, "loss": 1.1344, "step": 18271 }, { "epoch": 0.55, "learning_rate": 2.213657860660171e-06, "loss": 1.15, "step": 18272 }, { "epoch": 0.55, "learning_rate": 2.2134155472131593e-06, "loss": 1.069, "step": 18273 }, { "epoch": 0.55, "learning_rate": 2.2131732364942934e-06, "loss": 1.2167, "step": 18274 }, { "epoch": 0.55, "learning_rate": 2.2129309285058815e-06, "loss": 1.1119, "step": 18275 }, { "epoch": 0.55, "learning_rate": 2.2126886232502274e-06, "loss": 1.1187, "step": 18276 }, { "epoch": 0.55, "learning_rate": 2.2124463207296398e-06, "loss": 1.0283, "step": 18277 }, { "epoch": 0.55, "learning_rate": 2.212204020946424e-06, "loss": 1.0771, "step": 18278 }, { "epoch": 0.55, "learning_rate": 2.2119617239028888e-06, "loss": 1.2192, "step": 18279 }, { "epoch": 0.55, "learning_rate": 2.211719429601338e-06, "loss": 1.0573, "step": 18280 }, { "epoch": 0.55, "learning_rate": 2.21147713804408e-06, "loss": 1.251, "step": 18281 }, { "epoch": 0.55, "learning_rate": 2.21123484923342e-06, "loss": 1.0673, "step": 18282 }, { "epoch": 0.55, "learning_rate": 2.210992563171667e-06, "loss": 1.11, "step": 18283 }, { "epoch": 0.55, "learning_rate": 2.210750279861124e-06, "loss": 1.2083, "step": 18284 }, { "epoch": 0.55, "learning_rate": 2.210507999304099e-06, "loss": 1.0718, "step": 18285 }, { "epoch": 0.55, "learning_rate": 2.2102657215028986e-06, "loss": 1.1376, "step": 18286 }, { "epoch": 0.55, "learning_rate": 2.210023446459829e-06, "loss": 1.1777, "step": 18287 }, { "epoch": 0.55, "learning_rate": 2.2097811741771973e-06, "loss": 1.1807, "step": 18288 }, { "epoch": 0.55, "learning_rate": 2.2095389046573084e-06, "loss": 1.1161, "step": 18289 }, { "epoch": 0.55, "learning_rate": 2.2092966379024693e-06, "loss": 1.0558, "step": 18290 }, { "epoch": 0.55, "learning_rate": 2.2090543739149855e-06, "loss": 0.9648, "step": 18291 }, { "epoch": 0.55, "learning_rate": 2.208812112697165e-06, "loss": 1.234, "step": 18292 }, { "epoch": 0.55, "learning_rate": 2.2085698542513126e-06, "loss": 1.1889, "step": 18293 }, { "epoch": 0.55, "learning_rate": 2.2083275985797344e-06, "loss": 1.1946, "step": 18294 }, { "epoch": 0.55, "learning_rate": 2.208085345684738e-06, "loss": 1.0875, "step": 18295 }, { "epoch": 0.55, "learning_rate": 2.207843095568628e-06, "loss": 1.1379, "step": 18296 }, { "epoch": 0.55, "learning_rate": 2.2076008482337107e-06, "loss": 1.0914, "step": 18297 }, { "epoch": 0.55, "learning_rate": 2.2073586036822923e-06, "loss": 1.1741, "step": 18298 }, { "epoch": 0.55, "learning_rate": 2.2071163619166793e-06, "loss": 1.2987, "step": 18299 }, { "epoch": 0.55, "learning_rate": 2.2068741229391778e-06, "loss": 1.1165, "step": 18300 }, { "epoch": 0.55, "learning_rate": 2.2066318867520937e-06, "loss": 1.0848, "step": 18301 }, { "epoch": 0.55, "learning_rate": 2.2063896533577327e-06, "loss": 1.1055, "step": 18302 }, { "epoch": 0.55, "learning_rate": 2.2061474227584e-06, "loss": 1.0702, "step": 18303 }, { "epoch": 0.55, "learning_rate": 2.2059051949564026e-06, "loss": 1.0439, "step": 18304 }, { "epoch": 0.55, "learning_rate": 2.205662969954047e-06, "loss": 1.1869, "step": 18305 }, { "epoch": 0.55, "learning_rate": 2.2054207477536375e-06, "loss": 1.2639, "step": 18306 }, { "epoch": 0.55, "learning_rate": 2.20517852835748e-06, "loss": 1.1332, "step": 18307 }, { "epoch": 0.55, "learning_rate": 2.204936311767881e-06, "loss": 1.0931, "step": 18308 }, { "epoch": 0.55, "learning_rate": 2.2046940979871474e-06, "loss": 1.1065, "step": 18309 }, { "epoch": 0.55, "learning_rate": 2.204451887017583e-06, "loss": 1.0738, "step": 18310 }, { "epoch": 0.55, "learning_rate": 2.204209678861494e-06, "loss": 1.129, "step": 18311 }, { "epoch": 0.55, "learning_rate": 2.203967473521186e-06, "loss": 1.1277, "step": 18312 }, { "epoch": 0.55, "learning_rate": 2.203725270998966e-06, "loss": 0.9816, "step": 18313 }, { "epoch": 0.55, "learning_rate": 2.2034830712971394e-06, "loss": 1.0471, "step": 18314 }, { "epoch": 0.55, "learning_rate": 2.20324087441801e-06, "loss": 1.1368, "step": 18315 }, { "epoch": 0.55, "learning_rate": 2.2029986803638847e-06, "loss": 0.9945, "step": 18316 }, { "epoch": 0.55, "learning_rate": 2.202756489137069e-06, "loss": 1.2177, "step": 18317 }, { "epoch": 0.55, "learning_rate": 2.202514300739869e-06, "loss": 1.1082, "step": 18318 }, { "epoch": 0.55, "learning_rate": 2.202272115174589e-06, "loss": 1.1437, "step": 18319 }, { "epoch": 0.55, "learning_rate": 2.202029932443535e-06, "loss": 1.0894, "step": 18320 }, { "epoch": 0.55, "learning_rate": 2.2017877525490123e-06, "loss": 1.2367, "step": 18321 }, { "epoch": 0.55, "learning_rate": 2.2015455754933275e-06, "loss": 1.1111, "step": 18322 }, { "epoch": 0.55, "learning_rate": 2.201303401278784e-06, "loss": 1.1359, "step": 18323 }, { "epoch": 0.55, "learning_rate": 2.201061229907689e-06, "loss": 1.2392, "step": 18324 }, { "epoch": 0.55, "learning_rate": 2.200819061382346e-06, "loss": 1.0987, "step": 18325 }, { "epoch": 0.55, "learning_rate": 2.200576895705062e-06, "loss": 1.046, "step": 18326 }, { "epoch": 0.55, "learning_rate": 2.2003347328781433e-06, "loss": 1.1072, "step": 18327 }, { "epoch": 0.55, "learning_rate": 2.2000925729038922e-06, "loss": 1.1032, "step": 18328 }, { "epoch": 0.55, "learning_rate": 2.1998504157846152e-06, "loss": 1.108, "step": 18329 }, { "epoch": 0.55, "learning_rate": 2.199608261522618e-06, "loss": 1.0274, "step": 18330 }, { "epoch": 0.55, "learning_rate": 2.1993661101202064e-06, "loss": 1.1189, "step": 18331 }, { "epoch": 0.55, "learning_rate": 2.1991239615796833e-06, "loss": 1.0402, "step": 18332 }, { "epoch": 0.55, "learning_rate": 2.198881815903355e-06, "loss": 1.1306, "step": 18333 }, { "epoch": 0.55, "learning_rate": 2.1986396730935275e-06, "loss": 0.9943, "step": 18334 }, { "epoch": 0.55, "learning_rate": 2.1983975331525056e-06, "loss": 1.1342, "step": 18335 }, { "epoch": 0.55, "learning_rate": 2.198155396082593e-06, "loss": 1.2175, "step": 18336 }, { "epoch": 0.55, "learning_rate": 2.197913261886096e-06, "loss": 1.1702, "step": 18337 }, { "epoch": 0.55, "learning_rate": 2.197671130565319e-06, "loss": 1.1566, "step": 18338 }, { "epoch": 0.55, "learning_rate": 2.1974290021225672e-06, "loss": 1.2028, "step": 18339 }, { "epoch": 0.55, "learning_rate": 2.197186876560147e-06, "loss": 1.0823, "step": 18340 }, { "epoch": 0.55, "learning_rate": 2.196944753880361e-06, "loss": 1.0901, "step": 18341 }, { "epoch": 0.55, "learning_rate": 2.196702634085514e-06, "loss": 1.0924, "step": 18342 }, { "epoch": 0.55, "learning_rate": 2.1964605171779124e-06, "loss": 1.22, "step": 18343 }, { "epoch": 0.55, "learning_rate": 2.196218403159862e-06, "loss": 1.04, "step": 18344 }, { "epoch": 0.55, "learning_rate": 2.1959762920336643e-06, "loss": 1.1479, "step": 18345 }, { "epoch": 0.55, "learning_rate": 2.1957341838016265e-06, "loss": 1.0876, "step": 18346 }, { "epoch": 0.55, "learning_rate": 2.195492078466052e-06, "loss": 1.0892, "step": 18347 }, { "epoch": 0.55, "learning_rate": 2.1952499760292474e-06, "loss": 1.178, "step": 18348 }, { "epoch": 0.55, "learning_rate": 2.1950078764935156e-06, "loss": 1.1271, "step": 18349 }, { "epoch": 0.55, "learning_rate": 2.1947657798611617e-06, "loss": 1.2216, "step": 18350 }, { "epoch": 0.55, "learning_rate": 2.194523686134491e-06, "loss": 1.0249, "step": 18351 }, { "epoch": 0.55, "learning_rate": 2.194281595315807e-06, "loss": 1.0363, "step": 18352 }, { "epoch": 0.55, "learning_rate": 2.194039507407417e-06, "loss": 1.1021, "step": 18353 }, { "epoch": 0.55, "learning_rate": 2.193797422411622e-06, "loss": 1.138, "step": 18354 }, { "epoch": 0.55, "learning_rate": 2.1935553403307277e-06, "loss": 1.0732, "step": 18355 }, { "epoch": 0.55, "learning_rate": 2.1933132611670395e-06, "loss": 1.0559, "step": 18356 }, { "epoch": 0.55, "learning_rate": 2.1930711849228618e-06, "loss": 1.1052, "step": 18357 }, { "epoch": 0.55, "learning_rate": 2.1928291116004983e-06, "loss": 1.0383, "step": 18358 }, { "epoch": 0.55, "learning_rate": 2.192587041202253e-06, "loss": 1.0784, "step": 18359 }, { "epoch": 0.55, "learning_rate": 2.1923449737304314e-06, "loss": 1.0482, "step": 18360 }, { "epoch": 0.55, "learning_rate": 2.192102909187338e-06, "loss": 1.2664, "step": 18361 }, { "epoch": 0.55, "learning_rate": 2.191860847575276e-06, "loss": 1.1669, "step": 18362 }, { "epoch": 0.55, "learning_rate": 2.191618788896551e-06, "loss": 1.1469, "step": 18363 }, { "epoch": 0.55, "learning_rate": 2.1913767331534655e-06, "loss": 1.1003, "step": 18364 }, { "epoch": 0.55, "learning_rate": 2.191134680348325e-06, "loss": 0.9663, "step": 18365 }, { "epoch": 0.55, "learning_rate": 2.1908926304834354e-06, "loss": 1.1909, "step": 18366 }, { "epoch": 0.55, "learning_rate": 2.1906505835610975e-06, "loss": 1.1372, "step": 18367 }, { "epoch": 0.55, "learning_rate": 2.190408539583617e-06, "loss": 1.1501, "step": 18368 }, { "epoch": 0.55, "learning_rate": 2.1901664985532985e-06, "loss": 1.1472, "step": 18369 }, { "epoch": 0.55, "learning_rate": 2.189924460472447e-06, "loss": 1.1133, "step": 18370 }, { "epoch": 0.55, "learning_rate": 2.1896824253433635e-06, "loss": 1.112, "step": 18371 }, { "epoch": 0.55, "learning_rate": 2.189440393168354e-06, "loss": 1.1477, "step": 18372 }, { "epoch": 0.55, "learning_rate": 2.1891983639497224e-06, "loss": 1.0427, "step": 18373 }, { "epoch": 0.55, "learning_rate": 2.1889563376897737e-06, "loss": 1.1997, "step": 18374 }, { "epoch": 0.55, "learning_rate": 2.18871431439081e-06, "loss": 1.2051, "step": 18375 }, { "epoch": 0.55, "learning_rate": 2.188472294055136e-06, "loss": 1.0682, "step": 18376 }, { "epoch": 0.55, "learning_rate": 2.1882302766850563e-06, "loss": 1.0164, "step": 18377 }, { "epoch": 0.55, "learning_rate": 2.1879882622828735e-06, "loss": 1.0808, "step": 18378 }, { "epoch": 0.55, "learning_rate": 2.187746250850893e-06, "loss": 1.1317, "step": 18379 }, { "epoch": 0.55, "learning_rate": 2.187504242391417e-06, "loss": 1.0598, "step": 18380 }, { "epoch": 0.55, "learning_rate": 2.1872622369067505e-06, "loss": 1.0648, "step": 18381 }, { "epoch": 0.55, "learning_rate": 2.187020234399197e-06, "loss": 1.1319, "step": 18382 }, { "epoch": 0.55, "learning_rate": 2.1867782348710607e-06, "loss": 1.0491, "step": 18383 }, { "epoch": 0.55, "learning_rate": 2.1865362383246437e-06, "loss": 1.0847, "step": 18384 }, { "epoch": 0.55, "learning_rate": 2.186294244762251e-06, "loss": 1.1276, "step": 18385 }, { "epoch": 0.55, "learning_rate": 2.1860522541861862e-06, "loss": 1.1456, "step": 18386 }, { "epoch": 0.55, "learning_rate": 2.185810266598753e-06, "loss": 1.0123, "step": 18387 }, { "epoch": 0.55, "learning_rate": 2.1855682820022546e-06, "loss": 1.0899, "step": 18388 }, { "epoch": 0.55, "learning_rate": 2.185326300398994e-06, "loss": 1.1667, "step": 18389 }, { "epoch": 0.55, "learning_rate": 2.185084321791276e-06, "loss": 1.2034, "step": 18390 }, { "epoch": 0.55, "learning_rate": 2.184842346181404e-06, "loss": 1.1876, "step": 18391 }, { "epoch": 0.55, "learning_rate": 2.18460037357168e-06, "loss": 1.0785, "step": 18392 }, { "epoch": 0.55, "learning_rate": 2.1843584039644095e-06, "loss": 1.1306, "step": 18393 }, { "epoch": 0.55, "learning_rate": 2.1841164373618946e-06, "loss": 1.2191, "step": 18394 }, { "epoch": 0.55, "learning_rate": 2.183874473766439e-06, "loss": 1.187, "step": 18395 }, { "epoch": 0.55, "learning_rate": 2.183632513180347e-06, "loss": 1.0518, "step": 18396 }, { "epoch": 0.55, "learning_rate": 2.1833905556059202e-06, "loss": 1.1575, "step": 18397 }, { "epoch": 0.55, "learning_rate": 2.1831486010454627e-06, "loss": 1.2056, "step": 18398 }, { "epoch": 0.55, "learning_rate": 2.182906649501278e-06, "loss": 1.1064, "step": 18399 }, { "epoch": 0.55, "learning_rate": 2.1826647009756707e-06, "loss": 1.2324, "step": 18400 }, { "epoch": 0.55, "learning_rate": 2.182422755470941e-06, "loss": 1.0498, "step": 18401 }, { "epoch": 0.55, "learning_rate": 2.182180812989394e-06, "loss": 1.1915, "step": 18402 }, { "epoch": 0.55, "learning_rate": 2.1819388735333327e-06, "loss": 1.0871, "step": 18403 }, { "epoch": 0.55, "learning_rate": 2.1816969371050605e-06, "loss": 1.1342, "step": 18404 }, { "epoch": 0.55, "learning_rate": 2.18145500370688e-06, "loss": 1.1516, "step": 18405 }, { "epoch": 0.55, "learning_rate": 2.1812130733410937e-06, "loss": 1.2537, "step": 18406 }, { "epoch": 0.55, "learning_rate": 2.1809711460100057e-06, "loss": 1.1302, "step": 18407 }, { "epoch": 0.55, "learning_rate": 2.180729221715919e-06, "loss": 1.1207, "step": 18408 }, { "epoch": 0.55, "learning_rate": 2.1804873004611372e-06, "loss": 1.1923, "step": 18409 }, { "epoch": 0.55, "learning_rate": 2.1802453822479617e-06, "loss": 1.0773, "step": 18410 }, { "epoch": 0.55, "learning_rate": 2.1800034670786956e-06, "loss": 1.0449, "step": 18411 }, { "epoch": 0.55, "learning_rate": 2.179761554955643e-06, "loss": 1.1783, "step": 18412 }, { "epoch": 0.55, "learning_rate": 2.179519645881107e-06, "loss": 1.1348, "step": 18413 }, { "epoch": 0.55, "learning_rate": 2.179277739857388e-06, "loss": 1.024, "step": 18414 }, { "epoch": 0.55, "learning_rate": 2.179035836886791e-06, "loss": 1.0501, "step": 18415 }, { "epoch": 0.55, "learning_rate": 2.178793936971618e-06, "loss": 1.1273, "step": 18416 }, { "epoch": 0.55, "learning_rate": 2.178552040114173e-06, "loss": 1.0458, "step": 18417 }, { "epoch": 0.55, "learning_rate": 2.178310146316757e-06, "loss": 1.3142, "step": 18418 }, { "epoch": 0.55, "learning_rate": 2.1780682555816733e-06, "loss": 1.1232, "step": 18419 }, { "epoch": 0.55, "learning_rate": 2.177826367911225e-06, "loss": 1.093, "step": 18420 }, { "epoch": 0.55, "learning_rate": 2.177584483307714e-06, "loss": 1.2118, "step": 18421 }, { "epoch": 0.55, "learning_rate": 2.1773426017734454e-06, "loss": 1.0427, "step": 18422 }, { "epoch": 0.55, "learning_rate": 2.177100723310718e-06, "loss": 1.2719, "step": 18423 }, { "epoch": 0.56, "learning_rate": 2.1768588479218367e-06, "loss": 1.0515, "step": 18424 }, { "epoch": 0.56, "learning_rate": 2.1766169756091034e-06, "loss": 1.1258, "step": 18425 }, { "epoch": 0.56, "learning_rate": 2.1763751063748215e-06, "loss": 1.1393, "step": 18426 }, { "epoch": 0.56, "learning_rate": 2.176133240221292e-06, "loss": 1.1303, "step": 18427 }, { "epoch": 0.56, "learning_rate": 2.1758913771508178e-06, "loss": 1.0704, "step": 18428 }, { "epoch": 0.56, "learning_rate": 2.1756495171657016e-06, "loss": 1.1299, "step": 18429 }, { "epoch": 0.56, "learning_rate": 2.1754076602682467e-06, "loss": 1.0614, "step": 18430 }, { "epoch": 0.56, "learning_rate": 2.1751658064607535e-06, "loss": 1.1577, "step": 18431 }, { "epoch": 0.56, "learning_rate": 2.174923955745526e-06, "loss": 1.0952, "step": 18432 }, { "epoch": 0.56, "learning_rate": 2.1746821081248654e-06, "loss": 1.0942, "step": 18433 }, { "epoch": 0.56, "learning_rate": 2.1744402636010744e-06, "loss": 1.0072, "step": 18434 }, { "epoch": 0.56, "learning_rate": 2.1741984221764567e-06, "loss": 1.1451, "step": 18435 }, { "epoch": 0.56, "learning_rate": 2.173956583853312e-06, "loss": 1.1776, "step": 18436 }, { "epoch": 0.56, "learning_rate": 2.1737147486339434e-06, "loss": 1.2236, "step": 18437 }, { "epoch": 0.56, "learning_rate": 2.173472916520653e-06, "loss": 0.9957, "step": 18438 }, { "epoch": 0.56, "learning_rate": 2.173231087515745e-06, "loss": 1.1697, "step": 18439 }, { "epoch": 0.56, "learning_rate": 2.172989261621518e-06, "loss": 0.9693, "step": 18440 }, { "epoch": 0.56, "learning_rate": 2.1727474388402756e-06, "loss": 1.0538, "step": 18441 }, { "epoch": 0.56, "learning_rate": 2.1725056191743203e-06, "loss": 1.1697, "step": 18442 }, { "epoch": 0.56, "learning_rate": 2.1722638026259545e-06, "loss": 1.1837, "step": 18443 }, { "epoch": 0.56, "learning_rate": 2.1720219891974787e-06, "loss": 1.0073, "step": 18444 }, { "epoch": 0.56, "learning_rate": 2.1717801788911955e-06, "loss": 1.1773, "step": 18445 }, { "epoch": 0.56, "learning_rate": 2.1715383717094073e-06, "loss": 1.1388, "step": 18446 }, { "epoch": 0.56, "learning_rate": 2.171296567654415e-06, "loss": 1.1121, "step": 18447 }, { "epoch": 0.56, "learning_rate": 2.1710547667285227e-06, "loss": 1.1571, "step": 18448 }, { "epoch": 0.56, "learning_rate": 2.1708129689340292e-06, "loss": 1.0723, "step": 18449 }, { "epoch": 0.56, "learning_rate": 2.170571174273238e-06, "loss": 1.0845, "step": 18450 }, { "epoch": 0.56, "learning_rate": 2.1703293827484504e-06, "loss": 1.1129, "step": 18451 }, { "epoch": 0.56, "learning_rate": 2.1700875943619692e-06, "loss": 0.9504, "step": 18452 }, { "epoch": 0.56, "learning_rate": 2.1698458091160943e-06, "loss": 1.178, "step": 18453 }, { "epoch": 0.56, "learning_rate": 2.1696040270131284e-06, "loss": 1.0582, "step": 18454 }, { "epoch": 0.56, "learning_rate": 2.169362248055373e-06, "loss": 0.9996, "step": 18455 }, { "epoch": 0.56, "learning_rate": 2.16912047224513e-06, "loss": 1.1436, "step": 18456 }, { "epoch": 0.56, "learning_rate": 2.1688786995847e-06, "loss": 1.1093, "step": 18457 }, { "epoch": 0.56, "learning_rate": 2.168636930076386e-06, "loss": 1.1201, "step": 18458 }, { "epoch": 0.56, "learning_rate": 2.168395163722489e-06, "loss": 1.1959, "step": 18459 }, { "epoch": 0.56, "learning_rate": 2.16815340052531e-06, "loss": 1.1185, "step": 18460 }, { "epoch": 0.56, "learning_rate": 2.167911640487151e-06, "loss": 1.1537, "step": 18461 }, { "epoch": 0.56, "learning_rate": 2.1676698836103132e-06, "loss": 1.1395, "step": 18462 }, { "epoch": 0.56, "learning_rate": 2.1674281298970977e-06, "loss": 1.1777, "step": 18463 }, { "epoch": 0.56, "learning_rate": 2.1671863793498064e-06, "loss": 0.979, "step": 18464 }, { "epoch": 0.56, "learning_rate": 2.1669446319707414e-06, "loss": 1.0674, "step": 18465 }, { "epoch": 0.56, "learning_rate": 2.166702887762202e-06, "loss": 1.1656, "step": 18466 }, { "epoch": 0.56, "learning_rate": 2.1664611467264906e-06, "loss": 1.1385, "step": 18467 }, { "epoch": 0.56, "learning_rate": 2.166219408865909e-06, "loss": 1.1266, "step": 18468 }, { "epoch": 0.56, "learning_rate": 2.1659776741827577e-06, "loss": 1.1602, "step": 18469 }, { "epoch": 0.56, "learning_rate": 2.165735942679338e-06, "loss": 1.1235, "step": 18470 }, { "epoch": 0.56, "learning_rate": 2.165494214357951e-06, "loss": 1.0527, "step": 18471 }, { "epoch": 0.56, "learning_rate": 2.1652524892208983e-06, "loss": 1.1505, "step": 18472 }, { "epoch": 0.56, "learning_rate": 2.1650107672704803e-06, "loss": 1.1576, "step": 18473 }, { "epoch": 0.56, "learning_rate": 2.1647690485089986e-06, "loss": 1.1799, "step": 18474 }, { "epoch": 0.56, "learning_rate": 2.164527332938754e-06, "loss": 1.1251, "step": 18475 }, { "epoch": 0.56, "learning_rate": 2.1642856205620476e-06, "loss": 1.1157, "step": 18476 }, { "epoch": 0.56, "learning_rate": 2.16404391138118e-06, "loss": 1.1172, "step": 18477 }, { "epoch": 0.56, "learning_rate": 2.1638022053984542e-06, "loss": 1.0547, "step": 18478 }, { "epoch": 0.56, "learning_rate": 2.163560502616168e-06, "loss": 1.0377, "step": 18479 }, { "epoch": 0.56, "learning_rate": 2.1633188030366242e-06, "loss": 1.1381, "step": 18480 }, { "epoch": 0.56, "learning_rate": 2.163077106662123e-06, "loss": 1.1854, "step": 18481 }, { "epoch": 0.56, "learning_rate": 2.1628354134949666e-06, "loss": 1.1223, "step": 18482 }, { "epoch": 0.56, "learning_rate": 2.1625937235374535e-06, "loss": 1.0361, "step": 18483 }, { "epoch": 0.56, "learning_rate": 2.162352036791886e-06, "loss": 1.0149, "step": 18484 }, { "epoch": 0.56, "learning_rate": 2.162110353260564e-06, "loss": 1.1516, "step": 18485 }, { "epoch": 0.56, "learning_rate": 2.1618686729457892e-06, "loss": 1.0838, "step": 18486 }, { "epoch": 0.56, "learning_rate": 2.161626995849862e-06, "loss": 1.1641, "step": 18487 }, { "epoch": 0.56, "learning_rate": 2.1613853219750825e-06, "loss": 1.1398, "step": 18488 }, { "epoch": 0.56, "learning_rate": 2.1611436513237512e-06, "loss": 1.1295, "step": 18489 }, { "epoch": 0.56, "learning_rate": 2.1609019838981696e-06, "loss": 1.1263, "step": 18490 }, { "epoch": 0.56, "learning_rate": 2.1606603197006386e-06, "loss": 1.0591, "step": 18491 }, { "epoch": 0.56, "learning_rate": 2.160418658733457e-06, "loss": 1.1483, "step": 18492 }, { "epoch": 0.56, "learning_rate": 2.1601770009989264e-06, "loss": 1.093, "step": 18493 }, { "epoch": 0.56, "learning_rate": 2.1599353464993466e-06, "loss": 1.1116, "step": 18494 }, { "epoch": 0.56, "learning_rate": 2.15969369523702e-06, "loss": 1.0399, "step": 18495 }, { "epoch": 0.56, "learning_rate": 2.1594520472142443e-06, "loss": 1.1722, "step": 18496 }, { "epoch": 0.56, "learning_rate": 2.159210402433321e-06, "loss": 1.0737, "step": 18497 }, { "epoch": 0.56, "learning_rate": 2.1589687608965507e-06, "loss": 1.1291, "step": 18498 }, { "epoch": 0.56, "learning_rate": 2.1587271226062334e-06, "loss": 1.1412, "step": 18499 }, { "epoch": 0.56, "learning_rate": 2.1584854875646704e-06, "loss": 1.0901, "step": 18500 }, { "epoch": 0.56, "learning_rate": 2.1582438557741605e-06, "loss": 1.048, "step": 18501 }, { "epoch": 0.56, "learning_rate": 2.158002227237004e-06, "loss": 1.1371, "step": 18502 }, { "epoch": 0.56, "learning_rate": 2.157760601955502e-06, "loss": 1.1899, "step": 18503 }, { "epoch": 0.56, "learning_rate": 2.1575189799319552e-06, "loss": 1.0049, "step": 18504 }, { "epoch": 0.56, "learning_rate": 2.1572773611686616e-06, "loss": 1.1959, "step": 18505 }, { "epoch": 0.56, "learning_rate": 2.1570357456679226e-06, "loss": 1.0903, "step": 18506 }, { "epoch": 0.56, "learning_rate": 2.156794133432038e-06, "loss": 1.1413, "step": 18507 }, { "epoch": 0.56, "learning_rate": 2.156552524463309e-06, "loss": 1.1627, "step": 18508 }, { "epoch": 0.56, "learning_rate": 2.156310918764034e-06, "loss": 1.127, "step": 18509 }, { "epoch": 0.56, "learning_rate": 2.1560693163365127e-06, "loss": 1.1282, "step": 18510 }, { "epoch": 0.56, "learning_rate": 2.1558277171830466e-06, "loss": 1.0903, "step": 18511 }, { "epoch": 0.56, "learning_rate": 2.1555861213059344e-06, "loss": 1.1228, "step": 18512 }, { "epoch": 0.56, "learning_rate": 2.155344528707477e-06, "loss": 1.0689, "step": 18513 }, { "epoch": 0.56, "learning_rate": 2.1551029393899736e-06, "loss": 1.1322, "step": 18514 }, { "epoch": 0.56, "learning_rate": 2.154861353355724e-06, "loss": 1.0526, "step": 18515 }, { "epoch": 0.56, "learning_rate": 2.1546197706070275e-06, "loss": 1.101, "step": 18516 }, { "epoch": 0.56, "learning_rate": 2.1543781911461863e-06, "loss": 1.1212, "step": 18517 }, { "epoch": 0.56, "learning_rate": 2.154136614975497e-06, "loss": 1.1147, "step": 18518 }, { "epoch": 0.56, "learning_rate": 2.15389504209726e-06, "loss": 1.1225, "step": 18519 }, { "epoch": 0.56, "learning_rate": 2.153653472513776e-06, "loss": 1.1214, "step": 18520 }, { "epoch": 0.56, "learning_rate": 2.153411906227345e-06, "loss": 1.0927, "step": 18521 }, { "epoch": 0.56, "learning_rate": 2.153170343240265e-06, "loss": 1.1768, "step": 18522 }, { "epoch": 0.56, "learning_rate": 2.152928783554836e-06, "loss": 1.1874, "step": 18523 }, { "epoch": 0.56, "learning_rate": 2.1526872271733577e-06, "loss": 1.1902, "step": 18524 }, { "epoch": 0.56, "learning_rate": 2.15244567409813e-06, "loss": 0.9997, "step": 18525 }, { "epoch": 0.56, "learning_rate": 2.1522041243314525e-06, "loss": 1.1086, "step": 18526 }, { "epoch": 0.56, "learning_rate": 2.1519625778756237e-06, "loss": 1.1345, "step": 18527 }, { "epoch": 0.56, "learning_rate": 2.1517210347329435e-06, "loss": 1.078, "step": 18528 }, { "epoch": 0.56, "learning_rate": 2.151479494905711e-06, "loss": 1.0695, "step": 18529 }, { "epoch": 0.56, "learning_rate": 2.1512379583962277e-06, "loss": 1.1329, "step": 18530 }, { "epoch": 0.56, "learning_rate": 2.1509964252067894e-06, "loss": 1.003, "step": 18531 }, { "epoch": 0.56, "learning_rate": 2.1507548953396973e-06, "loss": 1.0345, "step": 18532 }, { "epoch": 0.56, "learning_rate": 2.1505133687972505e-06, "loss": 1.1245, "step": 18533 }, { "epoch": 0.56, "learning_rate": 2.150271845581749e-06, "loss": 1.1139, "step": 18534 }, { "epoch": 0.56, "learning_rate": 2.15003032569549e-06, "loss": 1.077, "step": 18535 }, { "epoch": 0.56, "learning_rate": 2.1497888091407736e-06, "loss": 1.072, "step": 18536 }, { "epoch": 0.56, "learning_rate": 2.1495472959198994e-06, "loss": 1.1458, "step": 18537 }, { "epoch": 0.56, "learning_rate": 2.149305786035166e-06, "loss": 1.1395, "step": 18538 }, { "epoch": 0.56, "learning_rate": 2.149064279488873e-06, "loss": 1.0349, "step": 18539 }, { "epoch": 0.56, "learning_rate": 2.1488227762833187e-06, "loss": 1.0989, "step": 18540 }, { "epoch": 0.56, "learning_rate": 2.1485812764208025e-06, "loss": 1.0634, "step": 18541 }, { "epoch": 0.56, "learning_rate": 2.148339779903624e-06, "loss": 1.1371, "step": 18542 }, { "epoch": 0.56, "learning_rate": 2.148098286734081e-06, "loss": 1.1053, "step": 18543 }, { "epoch": 0.56, "learning_rate": 2.1478567969144726e-06, "loss": 1.1112, "step": 18544 }, { "epoch": 0.56, "learning_rate": 2.1476153104470977e-06, "loss": 1.1367, "step": 18545 }, { "epoch": 0.56, "learning_rate": 2.1473738273342553e-06, "loss": 1.131, "step": 18546 }, { "epoch": 0.56, "learning_rate": 2.1471323475782455e-06, "loss": 1.1193, "step": 18547 }, { "epoch": 0.56, "learning_rate": 2.1468908711813647e-06, "loss": 1.0791, "step": 18548 }, { "epoch": 0.56, "learning_rate": 2.1466493981459126e-06, "loss": 1.2239, "step": 18549 }, { "epoch": 0.56, "learning_rate": 2.146407928474188e-06, "loss": 1.0455, "step": 18550 }, { "epoch": 0.56, "learning_rate": 2.1461664621684897e-06, "loss": 1.1403, "step": 18551 }, { "epoch": 0.56, "learning_rate": 2.145924999231117e-06, "loss": 1.1382, "step": 18552 }, { "epoch": 0.56, "learning_rate": 2.145683539664368e-06, "loss": 1.0178, "step": 18553 }, { "epoch": 0.56, "learning_rate": 2.1454420834705396e-06, "loss": 1.1924, "step": 18554 }, { "epoch": 0.56, "learning_rate": 2.1452006306519322e-06, "loss": 1.0978, "step": 18555 }, { "epoch": 0.56, "learning_rate": 2.144959181210845e-06, "loss": 1.1605, "step": 18556 }, { "epoch": 0.56, "learning_rate": 2.1447177351495746e-06, "loss": 1.179, "step": 18557 }, { "epoch": 0.56, "learning_rate": 2.14447629247042e-06, "loss": 1.1379, "step": 18558 }, { "epoch": 0.56, "learning_rate": 2.14423485317568e-06, "loss": 1.1107, "step": 18559 }, { "epoch": 0.56, "learning_rate": 2.143993417267654e-06, "loss": 1.0507, "step": 18560 }, { "epoch": 0.56, "learning_rate": 2.143751984748638e-06, "loss": 1.1308, "step": 18561 }, { "epoch": 0.56, "learning_rate": 2.1435105556209316e-06, "loss": 1.0793, "step": 18562 }, { "epoch": 0.56, "learning_rate": 2.143269129886833e-06, "loss": 1.0979, "step": 18563 }, { "epoch": 0.56, "learning_rate": 2.1430277075486405e-06, "loss": 1.1359, "step": 18564 }, { "epoch": 0.56, "learning_rate": 2.1427862886086536e-06, "loss": 1.1115, "step": 18565 }, { "epoch": 0.56, "learning_rate": 2.1425448730691677e-06, "loss": 1.0593, "step": 18566 }, { "epoch": 0.56, "learning_rate": 2.1423034609324825e-06, "loss": 1.1487, "step": 18567 }, { "epoch": 0.56, "learning_rate": 2.142062052200896e-06, "loss": 1.2585, "step": 18568 }, { "epoch": 0.56, "learning_rate": 2.141820646876707e-06, "loss": 1.0703, "step": 18569 }, { "epoch": 0.56, "learning_rate": 2.141579244962213e-06, "loss": 1.1073, "step": 18570 }, { "epoch": 0.56, "learning_rate": 2.1413378464597115e-06, "loss": 1.0983, "step": 18571 }, { "epoch": 0.56, "learning_rate": 2.1410964513715007e-06, "loss": 1.0933, "step": 18572 }, { "epoch": 0.56, "learning_rate": 2.1408550596998803e-06, "loss": 1.2638, "step": 18573 }, { "epoch": 0.56, "learning_rate": 2.1406136714471458e-06, "loss": 1.1992, "step": 18574 }, { "epoch": 0.56, "learning_rate": 2.1403722866155955e-06, "loss": 1.2626, "step": 18575 }, { "epoch": 0.56, "learning_rate": 2.140130905207528e-06, "loss": 1.0295, "step": 18576 }, { "epoch": 0.56, "learning_rate": 2.1398895272252424e-06, "loss": 1.0544, "step": 18577 }, { "epoch": 0.56, "learning_rate": 2.139648152671034e-06, "loss": 1.0352, "step": 18578 }, { "epoch": 0.56, "learning_rate": 2.1394067815472012e-06, "loss": 1.0618, "step": 18579 }, { "epoch": 0.56, "learning_rate": 2.1391654138560424e-06, "loss": 1.1829, "step": 18580 }, { "epoch": 0.56, "learning_rate": 2.138924049599855e-06, "loss": 1.1246, "step": 18581 }, { "epoch": 0.56, "learning_rate": 2.138682688780937e-06, "loss": 1.1539, "step": 18582 }, { "epoch": 0.56, "learning_rate": 2.1384413314015858e-06, "loss": 1.0846, "step": 18583 }, { "epoch": 0.56, "learning_rate": 2.1381999774640986e-06, "loss": 1.127, "step": 18584 }, { "epoch": 0.56, "learning_rate": 2.137958626970774e-06, "loss": 1.1866, "step": 18585 }, { "epoch": 0.56, "learning_rate": 2.1377172799239092e-06, "loss": 1.2029, "step": 18586 }, { "epoch": 0.56, "learning_rate": 2.137475936325801e-06, "loss": 1.0718, "step": 18587 }, { "epoch": 0.56, "learning_rate": 2.1372345961787466e-06, "loss": 1.1064, "step": 18588 }, { "epoch": 0.56, "learning_rate": 2.1369932594850444e-06, "loss": 1.1667, "step": 18589 }, { "epoch": 0.56, "learning_rate": 2.136751926246993e-06, "loss": 1.1109, "step": 18590 }, { "epoch": 0.56, "learning_rate": 2.1365105964668868e-06, "loss": 1.0528, "step": 18591 }, { "epoch": 0.56, "learning_rate": 2.136269270147025e-06, "loss": 1.0887, "step": 18592 }, { "epoch": 0.56, "learning_rate": 2.136027947289704e-06, "loss": 1.1543, "step": 18593 }, { "epoch": 0.56, "learning_rate": 2.1357866278972224e-06, "loss": 1.0231, "step": 18594 }, { "epoch": 0.56, "learning_rate": 2.1355453119718766e-06, "loss": 1.1093, "step": 18595 }, { "epoch": 0.56, "learning_rate": 2.1353039995159637e-06, "loss": 1.0469, "step": 18596 }, { "epoch": 0.56, "learning_rate": 2.135062690531781e-06, "loss": 1.1535, "step": 18597 }, { "epoch": 0.56, "learning_rate": 2.134821385021626e-06, "loss": 1.1697, "step": 18598 }, { "epoch": 0.56, "learning_rate": 2.134580082987796e-06, "loss": 1.144, "step": 18599 }, { "epoch": 0.56, "learning_rate": 2.134338784432587e-06, "loss": 1.1179, "step": 18600 }, { "epoch": 0.56, "learning_rate": 2.1340974893582963e-06, "loss": 1.1049, "step": 18601 }, { "epoch": 0.56, "learning_rate": 2.133856197767222e-06, "loss": 1.0996, "step": 18602 }, { "epoch": 0.56, "learning_rate": 2.1336149096616606e-06, "loss": 1.2218, "step": 18603 }, { "epoch": 0.56, "learning_rate": 2.133373625043908e-06, "loss": 1.1201, "step": 18604 }, { "epoch": 0.56, "learning_rate": 2.1331323439162623e-06, "loss": 1.1199, "step": 18605 }, { "epoch": 0.56, "learning_rate": 2.132891066281019e-06, "loss": 1.2786, "step": 18606 }, { "epoch": 0.56, "learning_rate": 2.132649792140477e-06, "loss": 1.0687, "step": 18607 }, { "epoch": 0.56, "learning_rate": 2.132408521496932e-06, "loss": 1.2113, "step": 18608 }, { "epoch": 0.56, "learning_rate": 2.1321672543526805e-06, "loss": 1.0458, "step": 18609 }, { "epoch": 0.56, "learning_rate": 2.1319259907100198e-06, "loss": 1.046, "step": 18610 }, { "epoch": 0.56, "learning_rate": 2.1316847305712464e-06, "loss": 1.1392, "step": 18611 }, { "epoch": 0.56, "learning_rate": 2.131443473938658e-06, "loss": 1.0631, "step": 18612 }, { "epoch": 0.56, "learning_rate": 2.131202220814549e-06, "loss": 1.0074, "step": 18613 }, { "epoch": 0.56, "learning_rate": 2.130960971201217e-06, "loss": 1.1164, "step": 18614 }, { "epoch": 0.56, "learning_rate": 2.1307197251009588e-06, "loss": 0.9899, "step": 18615 }, { "epoch": 0.56, "learning_rate": 2.1304784825160725e-06, "loss": 1.1432, "step": 18616 }, { "epoch": 0.56, "learning_rate": 2.1302372434488517e-06, "loss": 1.1169, "step": 18617 }, { "epoch": 0.56, "learning_rate": 2.1299960079015945e-06, "loss": 1.0366, "step": 18618 }, { "epoch": 0.56, "learning_rate": 2.129754775876597e-06, "loss": 1.1526, "step": 18619 }, { "epoch": 0.56, "learning_rate": 2.1295135473761557e-06, "loss": 1.0276, "step": 18620 }, { "epoch": 0.56, "learning_rate": 2.1292723224025675e-06, "loss": 1.0145, "step": 18621 }, { "epoch": 0.56, "learning_rate": 2.1290311009581277e-06, "loss": 1.1824, "step": 18622 }, { "epoch": 0.56, "learning_rate": 2.128789883045133e-06, "loss": 1.1304, "step": 18623 }, { "epoch": 0.56, "learning_rate": 2.1285486686658805e-06, "loss": 1.1613, "step": 18624 }, { "epoch": 0.56, "learning_rate": 2.1283074578226658e-06, "loss": 1.1276, "step": 18625 }, { "epoch": 0.56, "learning_rate": 2.128066250517785e-06, "loss": 1.1149, "step": 18626 }, { "epoch": 0.56, "learning_rate": 2.127825046753534e-06, "loss": 1.1103, "step": 18627 }, { "epoch": 0.56, "learning_rate": 2.1275838465322092e-06, "loss": 1.0486, "step": 18628 }, { "epoch": 0.56, "learning_rate": 2.127342649856108e-06, "loss": 1.1835, "step": 18629 }, { "epoch": 0.56, "learning_rate": 2.127101456727524e-06, "loss": 1.1736, "step": 18630 }, { "epoch": 0.56, "learning_rate": 2.1268602671487545e-06, "loss": 1.1367, "step": 18631 }, { "epoch": 0.56, "learning_rate": 2.126619081122096e-06, "loss": 1.0654, "step": 18632 }, { "epoch": 0.56, "learning_rate": 2.126377898649844e-06, "loss": 1.0835, "step": 18633 }, { "epoch": 0.56, "learning_rate": 2.1261367197342943e-06, "loss": 1.1249, "step": 18634 }, { "epoch": 0.56, "learning_rate": 2.1258955443777434e-06, "loss": 1.1184, "step": 18635 }, { "epoch": 0.56, "learning_rate": 2.1256543725824863e-06, "loss": 1.0929, "step": 18636 }, { "epoch": 0.56, "learning_rate": 2.1254132043508195e-06, "loss": 1.2515, "step": 18637 }, { "epoch": 0.56, "learning_rate": 2.1251720396850386e-06, "loss": 1.0442, "step": 18638 }, { "epoch": 0.56, "learning_rate": 2.124930878587439e-06, "loss": 1.2523, "step": 18639 }, { "epoch": 0.56, "learning_rate": 2.1246897210603173e-06, "loss": 1.0479, "step": 18640 }, { "epoch": 0.56, "learning_rate": 2.124448567105968e-06, "loss": 1.0969, "step": 18641 }, { "epoch": 0.56, "learning_rate": 2.1242074167266888e-06, "loss": 1.2275, "step": 18642 }, { "epoch": 0.56, "learning_rate": 2.123966269924773e-06, "loss": 1.1541, "step": 18643 }, { "epoch": 0.56, "learning_rate": 2.1237251267025172e-06, "loss": 1.2259, "step": 18644 }, { "epoch": 0.56, "learning_rate": 2.123483987062217e-06, "loss": 1.0691, "step": 18645 }, { "epoch": 0.56, "learning_rate": 2.1232428510061676e-06, "loss": 1.1459, "step": 18646 }, { "epoch": 0.56, "learning_rate": 2.1230017185366664e-06, "loss": 1.1993, "step": 18647 }, { "epoch": 0.56, "learning_rate": 2.1227605896560057e-06, "loss": 1.2392, "step": 18648 }, { "epoch": 0.56, "learning_rate": 2.1225194643664827e-06, "loss": 1.1979, "step": 18649 }, { "epoch": 0.56, "learning_rate": 2.1222783426703927e-06, "loss": 1.2405, "step": 18650 }, { "epoch": 0.56, "learning_rate": 2.1220372245700313e-06, "loss": 1.061, "step": 18651 }, { "epoch": 0.56, "learning_rate": 2.121796110067693e-06, "loss": 1.1404, "step": 18652 }, { "epoch": 0.56, "learning_rate": 2.1215549991656738e-06, "loss": 1.1298, "step": 18653 }, { "epoch": 0.56, "learning_rate": 2.1213138918662687e-06, "loss": 1.0955, "step": 18654 }, { "epoch": 0.56, "learning_rate": 2.121072788171774e-06, "loss": 1.0924, "step": 18655 }, { "epoch": 0.56, "learning_rate": 2.1208316880844825e-06, "loss": 1.125, "step": 18656 }, { "epoch": 0.56, "learning_rate": 2.120590591606691e-06, "loss": 1.0315, "step": 18657 }, { "epoch": 0.56, "learning_rate": 2.1203494987406943e-06, "loss": 1.2681, "step": 18658 }, { "epoch": 0.56, "learning_rate": 2.1201084094887873e-06, "loss": 1.1536, "step": 18659 }, { "epoch": 0.56, "learning_rate": 2.1198673238532667e-06, "loss": 1.1724, "step": 18660 }, { "epoch": 0.56, "learning_rate": 2.1196262418364245e-06, "loss": 1.1602, "step": 18661 }, { "epoch": 0.56, "learning_rate": 2.119385163440558e-06, "loss": 1.1614, "step": 18662 }, { "epoch": 0.56, "learning_rate": 2.119144088667961e-06, "loss": 1.1638, "step": 18663 }, { "epoch": 0.56, "learning_rate": 2.1189030175209295e-06, "loss": 1.1305, "step": 18664 }, { "epoch": 0.56, "learning_rate": 2.118661950001757e-06, "loss": 1.0798, "step": 18665 }, { "epoch": 0.56, "learning_rate": 2.1184208861127393e-06, "loss": 1.1401, "step": 18666 }, { "epoch": 0.56, "learning_rate": 2.118179825856171e-06, "loss": 1.173, "step": 18667 }, { "epoch": 0.56, "learning_rate": 2.1179387692343478e-06, "loss": 1.1537, "step": 18668 }, { "epoch": 0.56, "learning_rate": 2.117697716249563e-06, "loss": 1.1787, "step": 18669 }, { "epoch": 0.56, "learning_rate": 2.117456666904111e-06, "loss": 1.0981, "step": 18670 }, { "epoch": 0.56, "learning_rate": 2.1172156212002878e-06, "loss": 0.9902, "step": 18671 }, { "epoch": 0.56, "learning_rate": 2.116974579140387e-06, "loss": 1.0784, "step": 18672 }, { "epoch": 0.56, "learning_rate": 2.1167335407267053e-06, "loss": 1.2532, "step": 18673 }, { "epoch": 0.56, "learning_rate": 2.1164925059615342e-06, "loss": 1.3434, "step": 18674 }, { "epoch": 0.56, "learning_rate": 2.11625147484717e-06, "loss": 1.1053, "step": 18675 }, { "epoch": 0.56, "learning_rate": 2.1160104473859074e-06, "loss": 1.1656, "step": 18676 }, { "epoch": 0.56, "learning_rate": 2.1157694235800404e-06, "loss": 1.0931, "step": 18677 }, { "epoch": 0.56, "learning_rate": 2.115528403431863e-06, "loss": 1.0064, "step": 18678 }, { "epoch": 0.56, "learning_rate": 2.11528738694367e-06, "loss": 1.1109, "step": 18679 }, { "epoch": 0.56, "learning_rate": 2.1150463741177557e-06, "loss": 1.1467, "step": 18680 }, { "epoch": 0.56, "learning_rate": 2.114805364956416e-06, "loss": 1.1617, "step": 18681 }, { "epoch": 0.56, "learning_rate": 2.114564359461942e-06, "loss": 1.0472, "step": 18682 }, { "epoch": 0.56, "learning_rate": 2.1143233576366305e-06, "loss": 1.1259, "step": 18683 }, { "epoch": 0.56, "learning_rate": 2.1140823594827743e-06, "loss": 1.1356, "step": 18684 }, { "epoch": 0.56, "learning_rate": 2.113841365002668e-06, "loss": 1.1784, "step": 18685 }, { "epoch": 0.56, "learning_rate": 2.1136003741986075e-06, "loss": 1.1871, "step": 18686 }, { "epoch": 0.56, "learning_rate": 2.113359387072884e-06, "loss": 1.1859, "step": 18687 }, { "epoch": 0.56, "learning_rate": 2.113118403627793e-06, "loss": 1.1255, "step": 18688 }, { "epoch": 0.56, "learning_rate": 2.1128774238656284e-06, "loss": 1.1266, "step": 18689 }, { "epoch": 0.56, "learning_rate": 2.1126364477886847e-06, "loss": 1.1381, "step": 18690 }, { "epoch": 0.56, "learning_rate": 2.1123954753992554e-06, "loss": 1.1759, "step": 18691 }, { "epoch": 0.56, "learning_rate": 2.112154506699634e-06, "loss": 1.1434, "step": 18692 }, { "epoch": 0.56, "learning_rate": 2.1119135416921152e-06, "loss": 1.2115, "step": 18693 }, { "epoch": 0.56, "learning_rate": 2.1116725803789936e-06, "loss": 1.072, "step": 18694 }, { "epoch": 0.56, "learning_rate": 2.111431622762561e-06, "loss": 1.1347, "step": 18695 }, { "epoch": 0.56, "learning_rate": 2.1111906688451117e-06, "loss": 1.1581, "step": 18696 }, { "epoch": 0.56, "learning_rate": 2.1109497186289403e-06, "loss": 1.1279, "step": 18697 }, { "epoch": 0.56, "learning_rate": 2.1107087721163404e-06, "loss": 1.109, "step": 18698 }, { "epoch": 0.56, "learning_rate": 2.1104678293096067e-06, "loss": 1.1539, "step": 18699 }, { "epoch": 0.56, "learning_rate": 2.1102268902110303e-06, "loss": 1.1989, "step": 18700 }, { "epoch": 0.56, "learning_rate": 2.109985954822906e-06, "loss": 1.0609, "step": 18701 }, { "epoch": 0.56, "learning_rate": 2.1097450231475276e-06, "loss": 1.0835, "step": 18702 }, { "epoch": 0.56, "learning_rate": 2.1095040951871896e-06, "loss": 1.0323, "step": 18703 }, { "epoch": 0.56, "learning_rate": 2.1092631709441837e-06, "loss": 1.1834, "step": 18704 }, { "epoch": 0.56, "learning_rate": 2.1090222504208044e-06, "loss": 1.2001, "step": 18705 }, { "epoch": 0.56, "learning_rate": 2.1087813336193454e-06, "loss": 1.089, "step": 18706 }, { "epoch": 0.56, "learning_rate": 2.1085404205420997e-06, "loss": 1.0908, "step": 18707 }, { "epoch": 0.56, "learning_rate": 2.1082995111913602e-06, "loss": 1.1307, "step": 18708 }, { "epoch": 0.56, "learning_rate": 2.1080586055694203e-06, "loss": 1.0406, "step": 18709 }, { "epoch": 0.56, "learning_rate": 2.107817703678574e-06, "loss": 1.1763, "step": 18710 }, { "epoch": 0.56, "learning_rate": 2.107576805521114e-06, "loss": 1.2608, "step": 18711 }, { "epoch": 0.56, "learning_rate": 2.1073359110993354e-06, "loss": 1.1418, "step": 18712 }, { "epoch": 0.56, "learning_rate": 2.107095020415529e-06, "loss": 1.1248, "step": 18713 }, { "epoch": 0.56, "learning_rate": 2.106854133471988e-06, "loss": 1.0106, "step": 18714 }, { "epoch": 0.56, "learning_rate": 2.1066132502710064e-06, "loss": 0.9861, "step": 18715 }, { "epoch": 0.56, "learning_rate": 2.106372370814878e-06, "loss": 1.0226, "step": 18716 }, { "epoch": 0.56, "learning_rate": 2.106131495105895e-06, "loss": 1.09, "step": 18717 }, { "epoch": 0.56, "learning_rate": 2.10589062314635e-06, "loss": 1.1647, "step": 18718 }, { "epoch": 0.56, "learning_rate": 2.1056497549385363e-06, "loss": 1.1434, "step": 18719 }, { "epoch": 0.56, "learning_rate": 2.1054088904847477e-06, "loss": 1.0916, "step": 18720 }, { "epoch": 0.56, "learning_rate": 2.1051680297872758e-06, "loss": 1.0136, "step": 18721 }, { "epoch": 0.56, "learning_rate": 2.1049271728484143e-06, "loss": 1.0704, "step": 18722 }, { "epoch": 0.56, "learning_rate": 2.1046863196704553e-06, "loss": 1.1168, "step": 18723 }, { "epoch": 0.56, "learning_rate": 2.1044454702556927e-06, "loss": 1.1318, "step": 18724 }, { "epoch": 0.56, "learning_rate": 2.1042046246064196e-06, "loss": 1.1801, "step": 18725 }, { "epoch": 0.56, "learning_rate": 2.1039637827249266e-06, "loss": 1.0715, "step": 18726 }, { "epoch": 0.56, "learning_rate": 2.103722944613508e-06, "loss": 1.182, "step": 18727 }, { "epoch": 0.56, "learning_rate": 2.1034821102744556e-06, "loss": 1.0845, "step": 18728 }, { "epoch": 0.56, "learning_rate": 2.1032412797100643e-06, "loss": 1.0723, "step": 18729 }, { "epoch": 0.56, "learning_rate": 2.1030004529226234e-06, "loss": 1.2538, "step": 18730 }, { "epoch": 0.56, "learning_rate": 2.102759629914427e-06, "loss": 1.1334, "step": 18731 }, { "epoch": 0.56, "learning_rate": 2.102518810687768e-06, "loss": 1.0167, "step": 18732 }, { "epoch": 0.56, "learning_rate": 2.1022779952449383e-06, "loss": 1.1067, "step": 18733 }, { "epoch": 0.56, "learning_rate": 2.1020371835882308e-06, "loss": 1.1436, "step": 18734 }, { "epoch": 0.56, "learning_rate": 2.1017963757199374e-06, "loss": 1.1401, "step": 18735 }, { "epoch": 0.56, "learning_rate": 2.10155557164235e-06, "loss": 1.2282, "step": 18736 }, { "epoch": 0.56, "learning_rate": 2.1013147713577626e-06, "loss": 1.1786, "step": 18737 }, { "epoch": 0.56, "learning_rate": 2.101073974868467e-06, "loss": 1.1229, "step": 18738 }, { "epoch": 0.56, "learning_rate": 2.1008331821767543e-06, "loss": 1.092, "step": 18739 }, { "epoch": 0.56, "learning_rate": 2.1005923932849174e-06, "loss": 1.1306, "step": 18740 }, { "epoch": 0.56, "learning_rate": 2.1003516081952483e-06, "loss": 1.0541, "step": 18741 }, { "epoch": 0.56, "learning_rate": 2.1001108269100413e-06, "loss": 1.0657, "step": 18742 }, { "epoch": 0.56, "learning_rate": 2.099870049431585e-06, "loss": 1.191, "step": 18743 }, { "epoch": 0.56, "learning_rate": 2.0996292757621727e-06, "loss": 1.1149, "step": 18744 }, { "epoch": 0.56, "learning_rate": 2.0993885059040974e-06, "loss": 1.1442, "step": 18745 }, { "epoch": 0.56, "learning_rate": 2.099147739859651e-06, "loss": 1.1466, "step": 18746 }, { "epoch": 0.56, "learning_rate": 2.098906977631125e-06, "loss": 1.1511, "step": 18747 }, { "epoch": 0.56, "learning_rate": 2.0986662192208108e-06, "loss": 1.1431, "step": 18748 }, { "epoch": 0.56, "learning_rate": 2.098425464631001e-06, "loss": 1.087, "step": 18749 }, { "epoch": 0.56, "learning_rate": 2.098184713863987e-06, "loss": 1.0081, "step": 18750 }, { "epoch": 0.56, "learning_rate": 2.0979439669220626e-06, "loss": 1.0108, "step": 18751 }, { "epoch": 0.56, "learning_rate": 2.097703223807517e-06, "loss": 1.0934, "step": 18752 }, { "epoch": 0.56, "learning_rate": 2.0974624845226427e-06, "loss": 1.0634, "step": 18753 }, { "epoch": 0.56, "learning_rate": 2.0972217490697316e-06, "loss": 1.1246, "step": 18754 }, { "epoch": 0.56, "learning_rate": 2.096981017451077e-06, "loss": 1.3098, "step": 18755 }, { "epoch": 0.57, "learning_rate": 2.0967402896689677e-06, "loss": 1.1605, "step": 18756 }, { "epoch": 0.57, "learning_rate": 2.0964995657256965e-06, "loss": 1.1138, "step": 18757 }, { "epoch": 0.57, "learning_rate": 2.096258845623555e-06, "loss": 1.0773, "step": 18758 }, { "epoch": 0.57, "learning_rate": 2.0960181293648357e-06, "loss": 1.0995, "step": 18759 }, { "epoch": 0.57, "learning_rate": 2.0957774169518284e-06, "loss": 1.092, "step": 18760 }, { "epoch": 0.57, "learning_rate": 2.0955367083868254e-06, "loss": 1.1152, "step": 18761 }, { "epoch": 0.57, "learning_rate": 2.0952960036721186e-06, "loss": 0.9997, "step": 18762 }, { "epoch": 0.57, "learning_rate": 2.0950553028099997e-06, "loss": 1.1654, "step": 18763 }, { "epoch": 0.57, "learning_rate": 2.094814605802758e-06, "loss": 1.1587, "step": 18764 }, { "epoch": 0.57, "learning_rate": 2.0945739126526864e-06, "loss": 1.0474, "step": 18765 }, { "epoch": 0.57, "learning_rate": 2.0943332233620756e-06, "loss": 1.1011, "step": 18766 }, { "epoch": 0.57, "learning_rate": 2.0940925379332176e-06, "loss": 1.129, "step": 18767 }, { "epoch": 0.57, "learning_rate": 2.0938518563684037e-06, "loss": 1.1016, "step": 18768 }, { "epoch": 0.57, "learning_rate": 2.0936111786699237e-06, "loss": 1.1389, "step": 18769 }, { "epoch": 0.57, "learning_rate": 2.09337050484007e-06, "loss": 1.1968, "step": 18770 }, { "epoch": 0.57, "learning_rate": 2.0931298348811323e-06, "loss": 0.9937, "step": 18771 }, { "epoch": 0.57, "learning_rate": 2.0928891687954037e-06, "loss": 1.1478, "step": 18772 }, { "epoch": 0.57, "learning_rate": 2.0926485065851736e-06, "loss": 1.1194, "step": 18773 }, { "epoch": 0.57, "learning_rate": 2.0924078482527336e-06, "loss": 1.256, "step": 18774 }, { "epoch": 0.57, "learning_rate": 2.0921671938003745e-06, "loss": 1.0274, "step": 18775 }, { "epoch": 0.57, "learning_rate": 2.0919265432303884e-06, "loss": 1.2088, "step": 18776 }, { "epoch": 0.57, "learning_rate": 2.091685896545064e-06, "loss": 1.1266, "step": 18777 }, { "epoch": 0.57, "learning_rate": 2.0914452537466936e-06, "loss": 1.1248, "step": 18778 }, { "epoch": 0.57, "learning_rate": 2.091204614837567e-06, "loss": 1.1652, "step": 18779 }, { "epoch": 0.57, "learning_rate": 2.0909639798199756e-06, "loss": 1.2325, "step": 18780 }, { "epoch": 0.57, "learning_rate": 2.0907233486962113e-06, "loss": 1.1396, "step": 18781 }, { "epoch": 0.57, "learning_rate": 2.0904827214685626e-06, "loss": 1.0755, "step": 18782 }, { "epoch": 0.57, "learning_rate": 2.090242098139321e-06, "loss": 1.1249, "step": 18783 }, { "epoch": 0.57, "learning_rate": 2.0900014787107775e-06, "loss": 1.0887, "step": 18784 }, { "epoch": 0.57, "learning_rate": 2.089760863185223e-06, "loss": 1.0715, "step": 18785 }, { "epoch": 0.57, "learning_rate": 2.089520251564947e-06, "loss": 1.1662, "step": 18786 }, { "epoch": 0.57, "learning_rate": 2.0892796438522405e-06, "loss": 1.1879, "step": 18787 }, { "epoch": 0.57, "learning_rate": 2.089039040049394e-06, "loss": 1.1385, "step": 18788 }, { "epoch": 0.57, "learning_rate": 2.0887984401586985e-06, "loss": 1.041, "step": 18789 }, { "epoch": 0.57, "learning_rate": 2.0885578441824435e-06, "loss": 1.1868, "step": 18790 }, { "epoch": 0.57, "learning_rate": 2.088317252122919e-06, "loss": 1.0262, "step": 18791 }, { "epoch": 0.57, "learning_rate": 2.0880766639824165e-06, "loss": 1.1484, "step": 18792 }, { "epoch": 0.57, "learning_rate": 2.0878360797632257e-06, "loss": 1.1548, "step": 18793 }, { "epoch": 0.57, "learning_rate": 2.0875954994676376e-06, "loss": 1.1339, "step": 18794 }, { "epoch": 0.57, "learning_rate": 2.087354923097941e-06, "loss": 1.0225, "step": 18795 }, { "epoch": 0.57, "learning_rate": 2.0871143506564265e-06, "loss": 1.106, "step": 18796 }, { "epoch": 0.57, "learning_rate": 2.0868737821453846e-06, "loss": 1.0719, "step": 18797 }, { "epoch": 0.57, "learning_rate": 2.086633217567106e-06, "loss": 1.0817, "step": 18798 }, { "epoch": 0.57, "learning_rate": 2.0863926569238797e-06, "loss": 1.0107, "step": 18799 }, { "epoch": 0.57, "learning_rate": 2.086152100217996e-06, "loss": 1.0624, "step": 18800 }, { "epoch": 0.57, "learning_rate": 2.0859115474517454e-06, "loss": 1.1635, "step": 18801 }, { "epoch": 0.57, "learning_rate": 2.0856709986274175e-06, "loss": 1.0285, "step": 18802 }, { "epoch": 0.57, "learning_rate": 2.0854304537473014e-06, "loss": 1.1201, "step": 18803 }, { "epoch": 0.57, "learning_rate": 2.085189912813688e-06, "loss": 1.1794, "step": 18804 }, { "epoch": 0.57, "learning_rate": 2.084949375828867e-06, "loss": 1.2799, "step": 18805 }, { "epoch": 0.57, "learning_rate": 2.0847088427951274e-06, "loss": 1.2022, "step": 18806 }, { "epoch": 0.57, "learning_rate": 2.084468313714761e-06, "loss": 1.1957, "step": 18807 }, { "epoch": 0.57, "learning_rate": 2.0842277885900553e-06, "loss": 1.1544, "step": 18808 }, { "epoch": 0.57, "learning_rate": 2.083987267423301e-06, "loss": 1.0029, "step": 18809 }, { "epoch": 0.57, "learning_rate": 2.0837467502167867e-06, "loss": 0.9846, "step": 18810 }, { "epoch": 0.57, "learning_rate": 2.0835062369728044e-06, "loss": 1.0344, "step": 18811 }, { "epoch": 0.57, "learning_rate": 2.0832657276936415e-06, "loss": 1.1927, "step": 18812 }, { "epoch": 0.57, "learning_rate": 2.083025222381588e-06, "loss": 1.2679, "step": 18813 }, { "epoch": 0.57, "learning_rate": 2.0827847210389328e-06, "loss": 1.0879, "step": 18814 }, { "epoch": 0.57, "learning_rate": 2.0825442236679676e-06, "loss": 1.0745, "step": 18815 }, { "epoch": 0.57, "learning_rate": 2.082303730270979e-06, "loss": 1.1147, "step": 18816 }, { "epoch": 0.57, "learning_rate": 2.0820632408502584e-06, "loss": 1.119, "step": 18817 }, { "epoch": 0.57, "learning_rate": 2.081822755408094e-06, "loss": 1.1328, "step": 18818 }, { "epoch": 0.57, "learning_rate": 2.0815822739467754e-06, "loss": 1.0752, "step": 18819 }, { "epoch": 0.57, "learning_rate": 2.0813417964685937e-06, "loss": 1.1285, "step": 18820 }, { "epoch": 0.57, "learning_rate": 2.0811013229758355e-06, "loss": 0.9761, "step": 18821 }, { "epoch": 0.57, "learning_rate": 2.0808608534707903e-06, "loss": 1.0932, "step": 18822 }, { "epoch": 0.57, "learning_rate": 2.0806203879557483e-06, "loss": 1.1645, "step": 18823 }, { "epoch": 0.57, "learning_rate": 2.0803799264329993e-06, "loss": 1.1281, "step": 18824 }, { "epoch": 0.57, "learning_rate": 2.08013946890483e-06, "loss": 1.0539, "step": 18825 }, { "epoch": 0.57, "learning_rate": 2.0798990153735306e-06, "loss": 1.1426, "step": 18826 }, { "epoch": 0.57, "learning_rate": 2.0796585658413906e-06, "loss": 1.0593, "step": 18827 }, { "epoch": 0.57, "learning_rate": 2.0794181203106993e-06, "loss": 1.1703, "step": 18828 }, { "epoch": 0.57, "learning_rate": 2.079177678783744e-06, "loss": 1.1115, "step": 18829 }, { "epoch": 0.57, "learning_rate": 2.078937241262815e-06, "loss": 1.0381, "step": 18830 }, { "epoch": 0.57, "learning_rate": 2.0786968077502e-06, "loss": 1.1208, "step": 18831 }, { "epoch": 0.57, "learning_rate": 2.078456378248189e-06, "loss": 1.0919, "step": 18832 }, { "epoch": 0.57, "learning_rate": 2.0782159527590712e-06, "loss": 1.0062, "step": 18833 }, { "epoch": 0.57, "learning_rate": 2.0779755312851334e-06, "loss": 1.016, "step": 18834 }, { "epoch": 0.57, "learning_rate": 2.077735113828665e-06, "loss": 1.0655, "step": 18835 }, { "epoch": 0.57, "learning_rate": 2.077494700391955e-06, "loss": 1.1531, "step": 18836 }, { "epoch": 0.57, "learning_rate": 2.0772542909772935e-06, "loss": 1.3226, "step": 18837 }, { "epoch": 0.57, "learning_rate": 2.077013885586966e-06, "loss": 1.1322, "step": 18838 }, { "epoch": 0.57, "learning_rate": 2.0767734842232628e-06, "loss": 1.1211, "step": 18839 }, { "epoch": 0.57, "learning_rate": 2.076533086888472e-06, "loss": 1.1452, "step": 18840 }, { "epoch": 0.57, "learning_rate": 2.076292693584883e-06, "loss": 1.1699, "step": 18841 }, { "epoch": 0.57, "learning_rate": 2.076052304314783e-06, "loss": 1.1524, "step": 18842 }, { "epoch": 0.57, "learning_rate": 2.0758119190804603e-06, "loss": 1.167, "step": 18843 }, { "epoch": 0.57, "learning_rate": 2.0755715378842046e-06, "loss": 1.1564, "step": 18844 }, { "epoch": 0.57, "learning_rate": 2.075331160728303e-06, "loss": 1.0848, "step": 18845 }, { "epoch": 0.57, "learning_rate": 2.0750907876150454e-06, "loss": 1.0966, "step": 18846 }, { "epoch": 0.57, "learning_rate": 2.074850418546718e-06, "loss": 1.0629, "step": 18847 }, { "epoch": 0.57, "learning_rate": 2.0746100535256097e-06, "loss": 1.1579, "step": 18848 }, { "epoch": 0.57, "learning_rate": 2.074369692554009e-06, "loss": 1.0831, "step": 18849 }, { "epoch": 0.57, "learning_rate": 2.0741293356342045e-06, "loss": 1.1066, "step": 18850 }, { "epoch": 0.57, "learning_rate": 2.0738889827684827e-06, "loss": 1.1666, "step": 18851 }, { "epoch": 0.57, "learning_rate": 2.0736486339591327e-06, "loss": 1.0728, "step": 18852 }, { "epoch": 0.57, "learning_rate": 2.0734082892084423e-06, "loss": 1.0913, "step": 18853 }, { "epoch": 0.57, "learning_rate": 2.0731679485187e-06, "loss": 1.1466, "step": 18854 }, { "epoch": 0.57, "learning_rate": 2.072927611892193e-06, "loss": 0.9597, "step": 18855 }, { "epoch": 0.57, "learning_rate": 2.072687279331209e-06, "loss": 1.1471, "step": 18856 }, { "epoch": 0.57, "learning_rate": 2.0724469508380367e-06, "loss": 1.1277, "step": 18857 }, { "epoch": 0.57, "learning_rate": 2.072206626414963e-06, "loss": 1.1243, "step": 18858 }, { "epoch": 0.57, "learning_rate": 2.0719663060642777e-06, "loss": 1.0801, "step": 18859 }, { "epoch": 0.57, "learning_rate": 2.071725989788266e-06, "loss": 1.22, "step": 18860 }, { "epoch": 0.57, "learning_rate": 2.0714856775892165e-06, "loss": 1.2311, "step": 18861 }, { "epoch": 0.57, "learning_rate": 2.0712453694694167e-06, "loss": 0.9444, "step": 18862 }, { "epoch": 0.57, "learning_rate": 2.071005065431156e-06, "loss": 1.0182, "step": 18863 }, { "epoch": 0.57, "learning_rate": 2.070764765476719e-06, "loss": 1.1797, "step": 18864 }, { "epoch": 0.57, "learning_rate": 2.070524469608395e-06, "loss": 1.1336, "step": 18865 }, { "epoch": 0.57, "learning_rate": 2.070284177828471e-06, "loss": 1.1034, "step": 18866 }, { "epoch": 0.57, "learning_rate": 2.0700438901392355e-06, "loss": 1.1222, "step": 18867 }, { "epoch": 0.57, "learning_rate": 2.0698036065429746e-06, "loss": 1.3265, "step": 18868 }, { "epoch": 0.57, "learning_rate": 2.0695633270419757e-06, "loss": 1.0816, "step": 18869 }, { "epoch": 0.57, "learning_rate": 2.069323051638527e-06, "loss": 1.0903, "step": 18870 }, { "epoch": 0.57, "learning_rate": 2.0690827803349156e-06, "loss": 1.1207, "step": 18871 }, { "epoch": 0.57, "learning_rate": 2.068842513133429e-06, "loss": 1.0399, "step": 18872 }, { "epoch": 0.57, "learning_rate": 2.0686022500363533e-06, "loss": 1.1518, "step": 18873 }, { "epoch": 0.57, "learning_rate": 2.0683619910459764e-06, "loss": 1.2184, "step": 18874 }, { "epoch": 0.57, "learning_rate": 2.068121736164585e-06, "loss": 1.2869, "step": 18875 }, { "epoch": 0.57, "learning_rate": 2.0678814853944685e-06, "loss": 1.1581, "step": 18876 }, { "epoch": 0.57, "learning_rate": 2.0676412387379107e-06, "loss": 1.1331, "step": 18877 }, { "epoch": 0.57, "learning_rate": 2.0674009961972004e-06, "loss": 1.0408, "step": 18878 }, { "epoch": 0.57, "learning_rate": 2.067160757774624e-06, "loss": 1.0908, "step": 18879 }, { "epoch": 0.57, "learning_rate": 2.066920523472469e-06, "loss": 1.28, "step": 18880 }, { "epoch": 0.57, "learning_rate": 2.0666802932930218e-06, "loss": 1.1683, "step": 18881 }, { "epoch": 0.57, "learning_rate": 2.0664400672385702e-06, "loss": 1.2886, "step": 18882 }, { "epoch": 0.57, "learning_rate": 2.0661998453113998e-06, "loss": 1.1664, "step": 18883 }, { "epoch": 0.57, "learning_rate": 2.065959627513798e-06, "loss": 1.1499, "step": 18884 }, { "epoch": 0.57, "learning_rate": 2.0657194138480515e-06, "loss": 1.2281, "step": 18885 }, { "epoch": 0.57, "learning_rate": 2.0654792043164468e-06, "loss": 1.0354, "step": 18886 }, { "epoch": 0.57, "learning_rate": 2.065238998921271e-06, "loss": 1.1426, "step": 18887 }, { "epoch": 0.57, "learning_rate": 2.0649987976648102e-06, "loss": 1.2399, "step": 18888 }, { "epoch": 0.57, "learning_rate": 2.064758600549353e-06, "loss": 1.0776, "step": 18889 }, { "epoch": 0.57, "learning_rate": 2.0645184075771825e-06, "loss": 1.1086, "step": 18890 }, { "epoch": 0.57, "learning_rate": 2.0642782187505875e-06, "loss": 1.1361, "step": 18891 }, { "epoch": 0.57, "learning_rate": 2.064038034071854e-06, "loss": 1.0103, "step": 18892 }, { "epoch": 0.57, "learning_rate": 2.063797853543269e-06, "loss": 1.2328, "step": 18893 }, { "epoch": 0.57, "learning_rate": 2.063557677167118e-06, "loss": 1.0431, "step": 18894 }, { "epoch": 0.57, "learning_rate": 2.063317504945687e-06, "loss": 1.0508, "step": 18895 }, { "epoch": 0.57, "learning_rate": 2.0630773368812634e-06, "loss": 1.2059, "step": 18896 }, { "epoch": 0.57, "learning_rate": 2.062837172976133e-06, "loss": 1.0943, "step": 18897 }, { "epoch": 0.57, "learning_rate": 2.062597013232583e-06, "loss": 1.1365, "step": 18898 }, { "epoch": 0.57, "learning_rate": 2.062356857652898e-06, "loss": 1.103, "step": 18899 }, { "epoch": 0.57, "learning_rate": 2.062116706239365e-06, "loss": 1.07, "step": 18900 }, { "epoch": 0.57, "learning_rate": 2.06187655899427e-06, "loss": 1.2076, "step": 18901 }, { "epoch": 0.57, "learning_rate": 2.0616364159199006e-06, "loss": 1.1379, "step": 18902 }, { "epoch": 0.57, "learning_rate": 2.06139627701854e-06, "loss": 1.0497, "step": 18903 }, { "epoch": 0.57, "learning_rate": 2.061156142292476e-06, "loss": 1.1193, "step": 18904 }, { "epoch": 0.57, "learning_rate": 2.0609160117439937e-06, "loss": 1.1213, "step": 18905 }, { "epoch": 0.57, "learning_rate": 2.0606758853753805e-06, "loss": 1.0759, "step": 18906 }, { "epoch": 0.57, "learning_rate": 2.0604357631889206e-06, "loss": 1.1093, "step": 18907 }, { "epoch": 0.57, "learning_rate": 2.0601956451869003e-06, "loss": 1.0669, "step": 18908 }, { "epoch": 0.57, "learning_rate": 2.0599555313716055e-06, "loss": 1.1873, "step": 18909 }, { "epoch": 0.57, "learning_rate": 2.0597154217453224e-06, "loss": 1.0776, "step": 18910 }, { "epoch": 0.57, "learning_rate": 2.059475316310337e-06, "loss": 1.1097, "step": 18911 }, { "epoch": 0.57, "learning_rate": 2.0592352150689333e-06, "loss": 1.119, "step": 18912 }, { "epoch": 0.57, "learning_rate": 2.0589951180233984e-06, "loss": 0.9672, "step": 18913 }, { "epoch": 0.57, "learning_rate": 2.058755025176018e-06, "loss": 1.0205, "step": 18914 }, { "epoch": 0.57, "learning_rate": 2.0585149365290778e-06, "loss": 1.0718, "step": 18915 }, { "epoch": 0.57, "learning_rate": 2.0582748520848618e-06, "loss": 1.1952, "step": 18916 }, { "epoch": 0.57, "learning_rate": 2.0580347718456566e-06, "loss": 1.1796, "step": 18917 }, { "epoch": 0.57, "learning_rate": 2.0577946958137475e-06, "loss": 1.1998, "step": 18918 }, { "epoch": 0.57, "learning_rate": 2.0575546239914214e-06, "loss": 1.2219, "step": 18919 }, { "epoch": 0.57, "learning_rate": 2.0573145563809603e-06, "loss": 1.09, "step": 18920 }, { "epoch": 0.57, "learning_rate": 2.057074492984652e-06, "loss": 1.1005, "step": 18921 }, { "epoch": 0.57, "learning_rate": 2.056834433804781e-06, "loss": 1.1562, "step": 18922 }, { "epoch": 0.57, "learning_rate": 2.056594378843633e-06, "loss": 1.1665, "step": 18923 }, { "epoch": 0.57, "learning_rate": 2.0563543281034933e-06, "loss": 1.055, "step": 18924 }, { "epoch": 0.57, "learning_rate": 2.0561142815866463e-06, "loss": 1.1147, "step": 18925 }, { "epoch": 0.57, "learning_rate": 2.0558742392953772e-06, "loss": 1.047, "step": 18926 }, { "epoch": 0.57, "learning_rate": 2.0556342012319716e-06, "loss": 1.2299, "step": 18927 }, { "epoch": 0.57, "learning_rate": 2.0553941673987153e-06, "loss": 1.0388, "step": 18928 }, { "epoch": 0.57, "learning_rate": 2.0551541377978917e-06, "loss": 1.1548, "step": 18929 }, { "epoch": 0.57, "learning_rate": 2.0549141124317864e-06, "loss": 1.2458, "step": 18930 }, { "epoch": 0.57, "learning_rate": 2.0546740913026844e-06, "loss": 1.1918, "step": 18931 }, { "epoch": 0.57, "learning_rate": 2.0544340744128717e-06, "loss": 1.0829, "step": 18932 }, { "epoch": 0.57, "learning_rate": 2.0541940617646307e-06, "loss": 1.0366, "step": 18933 }, { "epoch": 0.57, "learning_rate": 2.0539540533602476e-06, "loss": 0.9856, "step": 18934 }, { "epoch": 0.57, "learning_rate": 2.053714049202007e-06, "loss": 1.1104, "step": 18935 }, { "epoch": 0.57, "learning_rate": 2.0534740492921947e-06, "loss": 1.1593, "step": 18936 }, { "epoch": 0.57, "learning_rate": 2.0532340536330934e-06, "loss": 1.1942, "step": 18937 }, { "epoch": 0.57, "learning_rate": 2.052994062226989e-06, "loss": 1.0866, "step": 18938 }, { "epoch": 0.57, "learning_rate": 2.0527540750761652e-06, "loss": 1.0982, "step": 18939 }, { "epoch": 0.57, "learning_rate": 2.052514092182908e-06, "loss": 1.083, "step": 18940 }, { "epoch": 0.57, "learning_rate": 2.052274113549502e-06, "loss": 1.0805, "step": 18941 }, { "epoch": 0.57, "learning_rate": 2.0520341391782296e-06, "loss": 1.133, "step": 18942 }, { "epoch": 0.57, "learning_rate": 2.051794169071377e-06, "loss": 1.0461, "step": 18943 }, { "epoch": 0.57, "learning_rate": 2.051554203231227e-06, "loss": 1.1024, "step": 18944 }, { "epoch": 0.57, "learning_rate": 2.0513142416600666e-06, "loss": 1.1644, "step": 18945 }, { "epoch": 0.57, "learning_rate": 2.051074284360178e-06, "loss": 0.9968, "step": 18946 }, { "epoch": 0.57, "learning_rate": 2.050834331333845e-06, "loss": 1.0734, "step": 18947 }, { "epoch": 0.57, "learning_rate": 2.0505943825833533e-06, "loss": 1.0579, "step": 18948 }, { "epoch": 0.57, "learning_rate": 2.0503544381109876e-06, "loss": 1.11, "step": 18949 }, { "epoch": 0.57, "learning_rate": 2.05011449791903e-06, "loss": 1.2106, "step": 18950 }, { "epoch": 0.57, "learning_rate": 2.0498745620097658e-06, "loss": 1.1884, "step": 18951 }, { "epoch": 0.57, "learning_rate": 2.049634630385479e-06, "loss": 1.0637, "step": 18952 }, { "epoch": 0.57, "learning_rate": 2.049394703048454e-06, "loss": 1.1286, "step": 18953 }, { "epoch": 0.57, "learning_rate": 2.0491547800009746e-06, "loss": 1.0853, "step": 18954 }, { "epoch": 0.57, "learning_rate": 2.048914861245324e-06, "loss": 1.0969, "step": 18955 }, { "epoch": 0.57, "learning_rate": 2.048674946783787e-06, "loss": 1.1891, "step": 18956 }, { "epoch": 0.57, "learning_rate": 2.048435036618647e-06, "loss": 1.0439, "step": 18957 }, { "epoch": 0.57, "learning_rate": 2.0481951307521886e-06, "loss": 1.0482, "step": 18958 }, { "epoch": 0.57, "learning_rate": 2.0479552291866944e-06, "loss": 1.0192, "step": 18959 }, { "epoch": 0.57, "learning_rate": 2.047715331924448e-06, "loss": 1.2094, "step": 18960 }, { "epoch": 0.57, "learning_rate": 2.0474754389677346e-06, "loss": 1.1097, "step": 18961 }, { "epoch": 0.57, "learning_rate": 2.0472355503188372e-06, "loss": 1.1371, "step": 18962 }, { "epoch": 0.57, "learning_rate": 2.046995665980039e-06, "loss": 1.1376, "step": 18963 }, { "epoch": 0.57, "learning_rate": 2.046755785953624e-06, "loss": 1.1334, "step": 18964 }, { "epoch": 0.57, "learning_rate": 2.0465159102418755e-06, "loss": 0.9823, "step": 18965 }, { "epoch": 0.57, "learning_rate": 2.046276038847077e-06, "loss": 1.1208, "step": 18966 }, { "epoch": 0.57, "learning_rate": 2.0460361717715128e-06, "loss": 1.1799, "step": 18967 }, { "epoch": 0.57, "learning_rate": 2.045796309017465e-06, "loss": 1.2462, "step": 18968 }, { "epoch": 0.57, "learning_rate": 2.045556450587217e-06, "loss": 1.1092, "step": 18969 }, { "epoch": 0.57, "learning_rate": 2.0453165964830533e-06, "loss": 1.103, "step": 18970 }, { "epoch": 0.57, "learning_rate": 2.0450767467072575e-06, "loss": 1.126, "step": 18971 }, { "epoch": 0.57, "learning_rate": 2.044836901262111e-06, "loss": 1.0905, "step": 18972 }, { "epoch": 0.57, "learning_rate": 2.0445970601498984e-06, "loss": 1.0632, "step": 18973 }, { "epoch": 0.57, "learning_rate": 2.044357223372902e-06, "loss": 1.1043, "step": 18974 }, { "epoch": 0.57, "learning_rate": 2.0441173909334064e-06, "loss": 1.0909, "step": 18975 }, { "epoch": 0.57, "learning_rate": 2.0438775628336928e-06, "loss": 1.1003, "step": 18976 }, { "epoch": 0.57, "learning_rate": 2.043637739076045e-06, "loss": 1.1351, "step": 18977 }, { "epoch": 0.57, "learning_rate": 2.043397919662746e-06, "loss": 1.1525, "step": 18978 }, { "epoch": 0.57, "learning_rate": 2.043158104596079e-06, "loss": 1.2548, "step": 18979 }, { "epoch": 0.57, "learning_rate": 2.0429182938783276e-06, "loss": 1.0671, "step": 18980 }, { "epoch": 0.57, "learning_rate": 2.0426784875117734e-06, "loss": 1.0883, "step": 18981 }, { "epoch": 0.57, "learning_rate": 2.0424386854986993e-06, "loss": 1.1075, "step": 18982 }, { "epoch": 0.57, "learning_rate": 2.0421988878413887e-06, "loss": 1.0009, "step": 18983 }, { "epoch": 0.57, "learning_rate": 2.0419590945421254e-06, "loss": 1.1166, "step": 18984 }, { "epoch": 0.57, "learning_rate": 2.04171930560319e-06, "loss": 1.1307, "step": 18985 }, { "epoch": 0.57, "learning_rate": 2.0414795210268658e-06, "loss": 1.0761, "step": 18986 }, { "epoch": 0.57, "learning_rate": 2.041239740815436e-06, "loss": 1.161, "step": 18987 }, { "epoch": 0.57, "learning_rate": 2.0409999649711837e-06, "loss": 1.1465, "step": 18988 }, { "epoch": 0.57, "learning_rate": 2.0407601934963896e-06, "loss": 1.124, "step": 18989 }, { "epoch": 0.57, "learning_rate": 2.0405204263933375e-06, "loss": 1.0268, "step": 18990 }, { "epoch": 0.57, "learning_rate": 2.0402806636643098e-06, "loss": 1.0876, "step": 18991 }, { "epoch": 0.57, "learning_rate": 2.0400409053115883e-06, "loss": 1.1262, "step": 18992 }, { "epoch": 0.57, "learning_rate": 2.0398011513374566e-06, "loss": 1.2939, "step": 18993 }, { "epoch": 0.57, "learning_rate": 2.0395614017441955e-06, "loss": 1.1579, "step": 18994 }, { "epoch": 0.57, "learning_rate": 2.039321656534089e-06, "loss": 1.1363, "step": 18995 }, { "epoch": 0.57, "learning_rate": 2.0390819157094174e-06, "loss": 1.0834, "step": 18996 }, { "epoch": 0.57, "learning_rate": 2.0388421792724656e-06, "loss": 1.0829, "step": 18997 }, { "epoch": 0.57, "learning_rate": 2.0386024472255127e-06, "loss": 1.1733, "step": 18998 }, { "epoch": 0.57, "learning_rate": 2.038362719570843e-06, "loss": 1.2906, "step": 18999 }, { "epoch": 0.57, "learning_rate": 2.038122996310737e-06, "loss": 1.2875, "step": 19000 }, { "epoch": 0.57, "learning_rate": 2.0378832774474793e-06, "loss": 1.0918, "step": 19001 }, { "epoch": 0.57, "learning_rate": 2.037643562983349e-06, "loss": 1.0082, "step": 19002 }, { "epoch": 0.57, "learning_rate": 2.0374038529206293e-06, "loss": 1.1705, "step": 19003 }, { "epoch": 0.57, "learning_rate": 2.037164147261602e-06, "loss": 1.0469, "step": 19004 }, { "epoch": 0.57, "learning_rate": 2.0369244460085494e-06, "loss": 1.1171, "step": 19005 }, { "epoch": 0.57, "learning_rate": 2.0366847491637535e-06, "loss": 1.121, "step": 19006 }, { "epoch": 0.57, "learning_rate": 2.036445056729495e-06, "loss": 1.1407, "step": 19007 }, { "epoch": 0.57, "learning_rate": 2.036205368708056e-06, "loss": 1.2538, "step": 19008 }, { "epoch": 0.57, "learning_rate": 2.035965685101719e-06, "loss": 1.0401, "step": 19009 }, { "epoch": 0.57, "learning_rate": 2.035726005912766e-06, "loss": 1.1209, "step": 19010 }, { "epoch": 0.57, "learning_rate": 2.035486331143477e-06, "loss": 1.147, "step": 19011 }, { "epoch": 0.57, "learning_rate": 2.035246660796134e-06, "loss": 1.1494, "step": 19012 }, { "epoch": 0.57, "learning_rate": 2.0350069948730197e-06, "loss": 1.2766, "step": 19013 }, { "epoch": 0.57, "learning_rate": 2.0347673333764155e-06, "loss": 1.0643, "step": 19014 }, { "epoch": 0.57, "learning_rate": 2.034527676308601e-06, "loss": 1.2264, "step": 19015 }, { "epoch": 0.57, "learning_rate": 2.034288023671859e-06, "loss": 1.1591, "step": 19016 }, { "epoch": 0.57, "learning_rate": 2.034048375468471e-06, "loss": 1.1575, "step": 19017 }, { "epoch": 0.57, "learning_rate": 2.0338087317007172e-06, "loss": 1.1616, "step": 19018 }, { "epoch": 0.57, "learning_rate": 2.033569092370881e-06, "loss": 1.147, "step": 19019 }, { "epoch": 0.57, "learning_rate": 2.033329457481242e-06, "loss": 1.1446, "step": 19020 }, { "epoch": 0.57, "learning_rate": 2.0330898270340813e-06, "loss": 0.9487, "step": 19021 }, { "epoch": 0.57, "learning_rate": 2.0328502010316804e-06, "loss": 1.103, "step": 19022 }, { "epoch": 0.57, "learning_rate": 2.0326105794763224e-06, "loss": 1.1336, "step": 19023 }, { "epoch": 0.57, "learning_rate": 2.032370962370285e-06, "loss": 1.1639, "step": 19024 }, { "epoch": 0.57, "learning_rate": 2.032131349715851e-06, "loss": 1.2335, "step": 19025 }, { "epoch": 0.57, "learning_rate": 2.031891741515301e-06, "loss": 1.157, "step": 19026 }, { "epoch": 0.57, "learning_rate": 2.0316521377709176e-06, "loss": 1.1507, "step": 19027 }, { "epoch": 0.57, "learning_rate": 2.0314125384849794e-06, "loss": 1.1196, "step": 19028 }, { "epoch": 0.57, "learning_rate": 2.0311729436597674e-06, "loss": 1.167, "step": 19029 }, { "epoch": 0.57, "learning_rate": 2.0309333532975636e-06, "loss": 1.1636, "step": 19030 }, { "epoch": 0.57, "learning_rate": 2.030693767400648e-06, "loss": 1.1904, "step": 19031 }, { "epoch": 0.57, "learning_rate": 2.030454185971303e-06, "loss": 1.2346, "step": 19032 }, { "epoch": 0.57, "learning_rate": 2.030214609011807e-06, "loss": 1.1287, "step": 19033 }, { "epoch": 0.57, "learning_rate": 2.029975036524442e-06, "loss": 1.077, "step": 19034 }, { "epoch": 0.57, "learning_rate": 2.0297354685114878e-06, "loss": 1.1824, "step": 19035 }, { "epoch": 0.57, "learning_rate": 2.0294959049752265e-06, "loss": 1.2335, "step": 19036 }, { "epoch": 0.57, "learning_rate": 2.029256345917937e-06, "loss": 1.1252, "step": 19037 }, { "epoch": 0.57, "learning_rate": 2.0290167913419e-06, "loss": 1.0311, "step": 19038 }, { "epoch": 0.57, "learning_rate": 2.0287772412493964e-06, "loss": 1.0079, "step": 19039 }, { "epoch": 0.57, "learning_rate": 2.0285376956427076e-06, "loss": 1.1166, "step": 19040 }, { "epoch": 0.57, "learning_rate": 2.0282981545241122e-06, "loss": 1.032, "step": 19041 }, { "epoch": 0.57, "learning_rate": 2.0280586178958905e-06, "loss": 1.0739, "step": 19042 }, { "epoch": 0.57, "learning_rate": 2.0278190857603234e-06, "loss": 1.0985, "step": 19043 }, { "epoch": 0.57, "learning_rate": 2.0275795581196917e-06, "loss": 1.0217, "step": 19044 }, { "epoch": 0.57, "learning_rate": 2.0273400349762756e-06, "loss": 1.1251, "step": 19045 }, { "epoch": 0.57, "learning_rate": 2.0271005163323543e-06, "loss": 1.1213, "step": 19046 }, { "epoch": 0.57, "learning_rate": 2.0268610021902087e-06, "loss": 1.2316, "step": 19047 }, { "epoch": 0.57, "learning_rate": 2.0266214925521175e-06, "loss": 1.04, "step": 19048 }, { "epoch": 0.57, "learning_rate": 2.0263819874203627e-06, "loss": 1.2775, "step": 19049 }, { "epoch": 0.57, "learning_rate": 2.0261424867972225e-06, "loss": 0.9562, "step": 19050 }, { "epoch": 0.57, "learning_rate": 2.025902990684978e-06, "loss": 1.1459, "step": 19051 }, { "epoch": 0.57, "learning_rate": 2.0256634990859084e-06, "loss": 1.0688, "step": 19052 }, { "epoch": 0.57, "learning_rate": 2.025424012002295e-06, "loss": 1.0933, "step": 19053 }, { "epoch": 0.57, "learning_rate": 2.0251845294364153e-06, "loss": 1.0485, "step": 19054 }, { "epoch": 0.57, "learning_rate": 2.0249450513905503e-06, "loss": 1.1295, "step": 19055 }, { "epoch": 0.57, "learning_rate": 2.02470557786698e-06, "loss": 1.0942, "step": 19056 }, { "epoch": 0.57, "learning_rate": 2.0244661088679828e-06, "loss": 1.1894, "step": 19057 }, { "epoch": 0.57, "learning_rate": 2.0242266443958406e-06, "loss": 1.1822, "step": 19058 }, { "epoch": 0.57, "learning_rate": 2.0239871844528307e-06, "loss": 1.1255, "step": 19059 }, { "epoch": 0.57, "learning_rate": 2.023747729041234e-06, "loss": 1.1901, "step": 19060 }, { "epoch": 0.57, "learning_rate": 2.0235082781633286e-06, "loss": 1.2617, "step": 19061 }, { "epoch": 0.57, "learning_rate": 2.023268831821396e-06, "loss": 1.0411, "step": 19062 }, { "epoch": 0.57, "learning_rate": 2.023029390017714e-06, "loss": 1.1458, "step": 19063 }, { "epoch": 0.57, "learning_rate": 2.0227899527545623e-06, "loss": 1.2105, "step": 19064 }, { "epoch": 0.57, "learning_rate": 2.0225505200342206e-06, "loss": 1.1465, "step": 19065 }, { "epoch": 0.57, "learning_rate": 2.0223110918589687e-06, "loss": 1.0302, "step": 19066 }, { "epoch": 0.57, "learning_rate": 2.022071668231085e-06, "loss": 1.1502, "step": 19067 }, { "epoch": 0.57, "learning_rate": 2.0218322491528478e-06, "loss": 1.0882, "step": 19068 }, { "epoch": 0.57, "learning_rate": 2.021592834626538e-06, "loss": 1.1974, "step": 19069 }, { "epoch": 0.57, "learning_rate": 2.021353424654433e-06, "loss": 1.1443, "step": 19070 }, { "epoch": 0.57, "learning_rate": 2.021114019238815e-06, "loss": 1.1513, "step": 19071 }, { "epoch": 0.57, "learning_rate": 2.0208746183819594e-06, "loss": 0.9953, "step": 19072 }, { "epoch": 0.57, "learning_rate": 2.020635222086147e-06, "loss": 0.9911, "step": 19073 }, { "epoch": 0.57, "learning_rate": 2.0203958303536562e-06, "loss": 1.157, "step": 19074 }, { "epoch": 0.57, "learning_rate": 2.0201564431867663e-06, "loss": 1.1667, "step": 19075 }, { "epoch": 0.57, "learning_rate": 2.0199170605877557e-06, "loss": 1.2239, "step": 19076 }, { "epoch": 0.57, "learning_rate": 2.0196776825589037e-06, "loss": 1.0728, "step": 19077 }, { "epoch": 0.57, "learning_rate": 2.0194383091024885e-06, "loss": 1.105, "step": 19078 }, { "epoch": 0.57, "learning_rate": 2.01919894022079e-06, "loss": 1.0795, "step": 19079 }, { "epoch": 0.57, "learning_rate": 2.0189595759160857e-06, "loss": 1.1118, "step": 19080 }, { "epoch": 0.57, "learning_rate": 2.0187202161906543e-06, "loss": 1.22, "step": 19081 }, { "epoch": 0.57, "learning_rate": 2.018480861046774e-06, "loss": 1.1818, "step": 19082 }, { "epoch": 0.57, "learning_rate": 2.0182415104867246e-06, "loss": 1.022, "step": 19083 }, { "epoch": 0.57, "learning_rate": 2.0180021645127855e-06, "loss": 1.0918, "step": 19084 }, { "epoch": 0.57, "learning_rate": 2.017762823127232e-06, "loss": 1.0288, "step": 19085 }, { "epoch": 0.57, "learning_rate": 2.017523486332344e-06, "loss": 1.0913, "step": 19086 }, { "epoch": 0.57, "learning_rate": 2.0172841541304004e-06, "loss": 1.196, "step": 19087 }, { "epoch": 0.58, "learning_rate": 2.0170448265236795e-06, "loss": 1.141, "step": 19088 }, { "epoch": 0.58, "learning_rate": 2.0168055035144587e-06, "loss": 1.1917, "step": 19089 }, { "epoch": 0.58, "learning_rate": 2.0165661851050168e-06, "loss": 1.1063, "step": 19090 }, { "epoch": 0.58, "learning_rate": 2.0163268712976324e-06, "loss": 1.1159, "step": 19091 }, { "epoch": 0.58, "learning_rate": 2.016087562094584e-06, "loss": 1.3617, "step": 19092 }, { "epoch": 0.58, "learning_rate": 2.015848257498148e-06, "loss": 1.2057, "step": 19093 }, { "epoch": 0.58, "learning_rate": 2.015608957510603e-06, "loss": 1.0914, "step": 19094 }, { "epoch": 0.58, "learning_rate": 2.0153696621342277e-06, "loss": 1.0963, "step": 19095 }, { "epoch": 0.58, "learning_rate": 2.0151303713713e-06, "loss": 1.1005, "step": 19096 }, { "epoch": 0.58, "learning_rate": 2.0148910852240984e-06, "loss": 1.114, "step": 19097 }, { "epoch": 0.58, "learning_rate": 2.014651803694899e-06, "loss": 1.1111, "step": 19098 }, { "epoch": 0.58, "learning_rate": 2.014412526785981e-06, "loss": 1.1217, "step": 19099 }, { "epoch": 0.58, "learning_rate": 2.0141732544996214e-06, "loss": 1.1486, "step": 19100 }, { "epoch": 0.58, "learning_rate": 2.0139339868380994e-06, "loss": 1.1682, "step": 19101 }, { "epoch": 0.58, "learning_rate": 2.0136947238036906e-06, "loss": 1.1558, "step": 19102 }, { "epoch": 0.58, "learning_rate": 2.0134554653986747e-06, "loss": 1.0338, "step": 19103 }, { "epoch": 0.58, "learning_rate": 2.0132162116253277e-06, "loss": 1.2238, "step": 19104 }, { "epoch": 0.58, "learning_rate": 2.0129769624859298e-06, "loss": 1.181, "step": 19105 }, { "epoch": 0.58, "learning_rate": 2.012737717982755e-06, "loss": 0.9578, "step": 19106 }, { "epoch": 0.58, "learning_rate": 2.0124984781180823e-06, "loss": 1.1204, "step": 19107 }, { "epoch": 0.58, "learning_rate": 2.0122592428941893e-06, "loss": 1.1343, "step": 19108 }, { "epoch": 0.58, "learning_rate": 2.0120200123133536e-06, "loss": 1.0775, "step": 19109 }, { "epoch": 0.58, "learning_rate": 2.0117807863778537e-06, "loss": 1.0162, "step": 19110 }, { "epoch": 0.58, "learning_rate": 2.0115415650899643e-06, "loss": 1.0391, "step": 19111 }, { "epoch": 0.58, "learning_rate": 2.011302348451964e-06, "loss": 1.1704, "step": 19112 }, { "epoch": 0.58, "learning_rate": 2.0110631364661296e-06, "loss": 1.1089, "step": 19113 }, { "epoch": 0.58, "learning_rate": 2.01082392913474e-06, "loss": 1.0563, "step": 19114 }, { "epoch": 0.58, "learning_rate": 2.01058472646007e-06, "loss": 1.0824, "step": 19115 }, { "epoch": 0.58, "learning_rate": 2.010345528444397e-06, "loss": 1.087, "step": 19116 }, { "epoch": 0.58, "learning_rate": 2.0101063350899996e-06, "loss": 1.1051, "step": 19117 }, { "epoch": 0.58, "learning_rate": 2.009867146399155e-06, "loss": 1.1301, "step": 19118 }, { "epoch": 0.58, "learning_rate": 2.0096279623741376e-06, "loss": 1.0259, "step": 19119 }, { "epoch": 0.58, "learning_rate": 2.0093887830172264e-06, "loss": 1.1165, "step": 19120 }, { "epoch": 0.58, "learning_rate": 2.0091496083306972e-06, "loss": 1.0084, "step": 19121 }, { "epoch": 0.58, "learning_rate": 2.0089104383168288e-06, "loss": 1.1052, "step": 19122 }, { "epoch": 0.58, "learning_rate": 2.008671272977895e-06, "loss": 1.2023, "step": 19123 }, { "epoch": 0.58, "learning_rate": 2.0084321123161742e-06, "loss": 1.0733, "step": 19124 }, { "epoch": 0.58, "learning_rate": 2.008192956333943e-06, "loss": 1.0165, "step": 19125 }, { "epoch": 0.58, "learning_rate": 2.0079538050334783e-06, "loss": 1.1847, "step": 19126 }, { "epoch": 0.58, "learning_rate": 2.0077146584170565e-06, "loss": 1.0522, "step": 19127 }, { "epoch": 0.58, "learning_rate": 2.0074755164869537e-06, "loss": 1.1061, "step": 19128 }, { "epoch": 0.58, "learning_rate": 2.0072363792454472e-06, "loss": 0.9749, "step": 19129 }, { "epoch": 0.58, "learning_rate": 2.0069972466948126e-06, "loss": 1.087, "step": 19130 }, { "epoch": 0.58, "learning_rate": 2.006758118837327e-06, "loss": 1.2848, "step": 19131 }, { "epoch": 0.58, "learning_rate": 2.0065189956752667e-06, "loss": 1.1411, "step": 19132 }, { "epoch": 0.58, "learning_rate": 2.0062798772109073e-06, "loss": 1.0288, "step": 19133 }, { "epoch": 0.58, "learning_rate": 2.006040763446526e-06, "loss": 1.1562, "step": 19134 }, { "epoch": 0.58, "learning_rate": 2.0058016543844e-06, "loss": 1.0878, "step": 19135 }, { "epoch": 0.58, "learning_rate": 2.0055625500268025e-06, "loss": 1.0611, "step": 19136 }, { "epoch": 0.58, "learning_rate": 2.0053234503760117e-06, "loss": 1.1069, "step": 19137 }, { "epoch": 0.58, "learning_rate": 2.0050843554343036e-06, "loss": 1.0157, "step": 19138 }, { "epoch": 0.58, "learning_rate": 2.004845265203954e-06, "loss": 1.054, "step": 19139 }, { "epoch": 0.58, "learning_rate": 2.00460617968724e-06, "loss": 1.0494, "step": 19140 }, { "epoch": 0.58, "learning_rate": 2.0043670988864358e-06, "loss": 1.0402, "step": 19141 }, { "epoch": 0.58, "learning_rate": 2.0041280228038175e-06, "loss": 1.1089, "step": 19142 }, { "epoch": 0.58, "learning_rate": 2.003888951441662e-06, "loss": 1.0332, "step": 19143 }, { "epoch": 0.58, "learning_rate": 2.003649884802245e-06, "loss": 1.3183, "step": 19144 }, { "epoch": 0.58, "learning_rate": 2.003410822887842e-06, "loss": 1.1197, "step": 19145 }, { "epoch": 0.58, "learning_rate": 2.0031717657007284e-06, "loss": 1.0045, "step": 19146 }, { "epoch": 0.58, "learning_rate": 2.0029327132431805e-06, "loss": 1.0927, "step": 19147 }, { "epoch": 0.58, "learning_rate": 2.0026936655174746e-06, "loss": 1.1553, "step": 19148 }, { "epoch": 0.58, "learning_rate": 2.002454622525885e-06, "loss": 1.201, "step": 19149 }, { "epoch": 0.58, "learning_rate": 2.0022155842706874e-06, "loss": 1.0943, "step": 19150 }, { "epoch": 0.58, "learning_rate": 2.0019765507541574e-06, "loss": 1.0335, "step": 19151 }, { "epoch": 0.58, "learning_rate": 2.001737521978571e-06, "loss": 1.0638, "step": 19152 }, { "epoch": 0.58, "learning_rate": 2.0014984979462046e-06, "loss": 1.067, "step": 19153 }, { "epoch": 0.58, "learning_rate": 2.0012594786593313e-06, "loss": 1.0734, "step": 19154 }, { "epoch": 0.58, "learning_rate": 2.0010204641202275e-06, "loss": 1.1334, "step": 19155 }, { "epoch": 0.58, "learning_rate": 2.000781454331169e-06, "loss": 1.0693, "step": 19156 }, { "epoch": 0.58, "learning_rate": 2.0005424492944302e-06, "loss": 1.0848, "step": 19157 }, { "epoch": 0.58, "learning_rate": 2.000303449012287e-06, "loss": 1.0087, "step": 19158 }, { "epoch": 0.58, "learning_rate": 2.000064453487014e-06, "loss": 1.1306, "step": 19159 }, { "epoch": 0.58, "learning_rate": 1.999825462720887e-06, "loss": 1.1162, "step": 19160 }, { "epoch": 0.58, "learning_rate": 1.999586476716181e-06, "loss": 1.2264, "step": 19161 }, { "epoch": 0.58, "learning_rate": 1.9993474954751703e-06, "loss": 1.264, "step": 19162 }, { "epoch": 0.58, "learning_rate": 1.99910851900013e-06, "loss": 1.0817, "step": 19163 }, { "epoch": 0.58, "learning_rate": 1.9988695472933358e-06, "loss": 1.0912, "step": 19164 }, { "epoch": 0.58, "learning_rate": 1.998630580357062e-06, "loss": 1.1539, "step": 19165 }, { "epoch": 0.58, "learning_rate": 1.9983916181935844e-06, "loss": 1.1728, "step": 19166 }, { "epoch": 0.58, "learning_rate": 1.998152660805176e-06, "loss": 1.09, "step": 19167 }, { "epoch": 0.58, "learning_rate": 1.9979137081941126e-06, "loss": 1.0897, "step": 19168 }, { "epoch": 0.58, "learning_rate": 1.997674760362669e-06, "loss": 1.0696, "step": 19169 }, { "epoch": 0.58, "learning_rate": 1.9974358173131205e-06, "loss": 1.178, "step": 19170 }, { "epoch": 0.58, "learning_rate": 1.99719687904774e-06, "loss": 1.1415, "step": 19171 }, { "epoch": 0.58, "learning_rate": 1.9969579455688033e-06, "loss": 1.0464, "step": 19172 }, { "epoch": 0.58, "learning_rate": 1.9967190168785843e-06, "loss": 1.1711, "step": 19173 }, { "epoch": 0.58, "learning_rate": 1.9964800929793595e-06, "loss": 1.0828, "step": 19174 }, { "epoch": 0.58, "learning_rate": 1.9962411738734005e-06, "loss": 1.2354, "step": 19175 }, { "epoch": 0.58, "learning_rate": 1.996002259562983e-06, "loss": 1.2506, "step": 19176 }, { "epoch": 0.58, "learning_rate": 1.995763350050381e-06, "loss": 1.1813, "step": 19177 }, { "epoch": 0.58, "learning_rate": 1.995524445337869e-06, "loss": 1.217, "step": 19178 }, { "epoch": 0.58, "learning_rate": 1.995285545427722e-06, "loss": 1.0772, "step": 19179 }, { "epoch": 0.58, "learning_rate": 1.9950466503222134e-06, "loss": 1.1161, "step": 19180 }, { "epoch": 0.58, "learning_rate": 1.994807760023617e-06, "loss": 1.2218, "step": 19181 }, { "epoch": 0.58, "learning_rate": 1.9945688745342075e-06, "loss": 1.0626, "step": 19182 }, { "epoch": 0.58, "learning_rate": 1.9943299938562592e-06, "loss": 1.1035, "step": 19183 }, { "epoch": 0.58, "learning_rate": 1.994091117992046e-06, "loss": 1.0557, "step": 19184 }, { "epoch": 0.58, "learning_rate": 1.993852246943841e-06, "loss": 1.186, "step": 19185 }, { "epoch": 0.58, "learning_rate": 1.993613380713919e-06, "loss": 1.1887, "step": 19186 }, { "epoch": 0.58, "learning_rate": 1.9933745193045548e-06, "loss": 1.224, "step": 19187 }, { "epoch": 0.58, "learning_rate": 1.99313566271802e-06, "loss": 1.2134, "step": 19188 }, { "epoch": 0.58, "learning_rate": 1.99289681095659e-06, "loss": 1.2327, "step": 19189 }, { "epoch": 0.58, "learning_rate": 1.992657964022538e-06, "loss": 1.1564, "step": 19190 }, { "epoch": 0.58, "learning_rate": 1.992419121918137e-06, "loss": 1.1627, "step": 19191 }, { "epoch": 0.58, "learning_rate": 1.992180284645664e-06, "loss": 1.0706, "step": 19192 }, { "epoch": 0.58, "learning_rate": 1.991941452207388e-06, "loss": 1.2129, "step": 19193 }, { "epoch": 0.58, "learning_rate": 1.9917026246055846e-06, "loss": 1.0811, "step": 19194 }, { "epoch": 0.58, "learning_rate": 1.991463801842528e-06, "loss": 1.1755, "step": 19195 }, { "epoch": 0.58, "learning_rate": 1.9912249839204912e-06, "loss": 1.1648, "step": 19196 }, { "epoch": 0.58, "learning_rate": 1.9909861708417476e-06, "loss": 1.0927, "step": 19197 }, { "epoch": 0.58, "learning_rate": 1.99074736260857e-06, "loss": 1.1473, "step": 19198 }, { "epoch": 0.58, "learning_rate": 1.9905085592232322e-06, "loss": 1.0124, "step": 19199 }, { "epoch": 0.58, "learning_rate": 1.990269760688009e-06, "loss": 1.1304, "step": 19200 }, { "epoch": 0.58, "learning_rate": 1.9900309670051705e-06, "loss": 1.0781, "step": 19201 }, { "epoch": 0.58, "learning_rate": 1.989792178176992e-06, "loss": 1.1414, "step": 19202 }, { "epoch": 0.58, "learning_rate": 1.989553394205746e-06, "loss": 1.1399, "step": 19203 }, { "epoch": 0.58, "learning_rate": 1.9893146150937063e-06, "loss": 1.0226, "step": 19204 }, { "epoch": 0.58, "learning_rate": 1.9890758408431465e-06, "loss": 1.037, "step": 19205 }, { "epoch": 0.58, "learning_rate": 1.9888370714563375e-06, "loss": 1.2209, "step": 19206 }, { "epoch": 0.58, "learning_rate": 1.988598306935553e-06, "loss": 1.1451, "step": 19207 }, { "epoch": 0.58, "learning_rate": 1.9883595472830668e-06, "loss": 1.1203, "step": 19208 }, { "epoch": 0.58, "learning_rate": 1.9881207925011514e-06, "loss": 1.1616, "step": 19209 }, { "epoch": 0.58, "learning_rate": 1.9878820425920793e-06, "loss": 1.038, "step": 19210 }, { "epoch": 0.58, "learning_rate": 1.987643297558124e-06, "loss": 1.2908, "step": 19211 }, { "epoch": 0.58, "learning_rate": 1.9874045574015573e-06, "loss": 1.1122, "step": 19212 }, { "epoch": 0.58, "learning_rate": 1.9871658221246524e-06, "loss": 0.9954, "step": 19213 }, { "epoch": 0.58, "learning_rate": 1.9869270917296817e-06, "loss": 1.1641, "step": 19214 }, { "epoch": 0.58, "learning_rate": 1.986688366218918e-06, "loss": 1.1011, "step": 19215 }, { "epoch": 0.58, "learning_rate": 1.986449645594634e-06, "loss": 1.0773, "step": 19216 }, { "epoch": 0.58, "learning_rate": 1.9862109298591018e-06, "loss": 1.3063, "step": 19217 }, { "epoch": 0.58, "learning_rate": 1.985972219014595e-06, "loss": 1.0861, "step": 19218 }, { "epoch": 0.58, "learning_rate": 1.985733513063384e-06, "loss": 1.0589, "step": 19219 }, { "epoch": 0.58, "learning_rate": 1.985494812007743e-06, "loss": 1.087, "step": 19220 }, { "epoch": 0.58, "learning_rate": 1.985256115849943e-06, "loss": 1.1694, "step": 19221 }, { "epoch": 0.58, "learning_rate": 1.9850174245922583e-06, "loss": 1.0133, "step": 19222 }, { "epoch": 0.58, "learning_rate": 1.984778738236958e-06, "loss": 1.1085, "step": 19223 }, { "epoch": 0.58, "learning_rate": 1.9845400567863166e-06, "loss": 1.0986, "step": 19224 }, { "epoch": 0.58, "learning_rate": 1.984301380242605e-06, "loss": 1.1525, "step": 19225 }, { "epoch": 0.58, "learning_rate": 1.9840627086080973e-06, "loss": 1.1557, "step": 19226 }, { "epoch": 0.58, "learning_rate": 1.983824041885063e-06, "loss": 1.1131, "step": 19227 }, { "epoch": 0.58, "learning_rate": 1.983585380075775e-06, "loss": 1.0661, "step": 19228 }, { "epoch": 0.58, "learning_rate": 1.983346723182506e-06, "loss": 1.0975, "step": 19229 }, { "epoch": 0.58, "learning_rate": 1.983108071207527e-06, "loss": 1.1304, "step": 19230 }, { "epoch": 0.58, "learning_rate": 1.9828694241531115e-06, "loss": 1.0729, "step": 19231 }, { "epoch": 0.58, "learning_rate": 1.982630782021529e-06, "loss": 1.1505, "step": 19232 }, { "epoch": 0.58, "learning_rate": 1.982392144815052e-06, "loss": 1.1548, "step": 19233 }, { "epoch": 0.58, "learning_rate": 1.9821535125359527e-06, "loss": 1.1168, "step": 19234 }, { "epoch": 0.58, "learning_rate": 1.9819148851865037e-06, "loss": 1.1077, "step": 19235 }, { "epoch": 0.58, "learning_rate": 1.9816762627689743e-06, "loss": 1.1315, "step": 19236 }, { "epoch": 0.58, "learning_rate": 1.981437645285637e-06, "loss": 1.2462, "step": 19237 }, { "epoch": 0.58, "learning_rate": 1.981199032738764e-06, "loss": 1.2123, "step": 19238 }, { "epoch": 0.58, "learning_rate": 1.9809604251306265e-06, "loss": 1.1223, "step": 19239 }, { "epoch": 0.58, "learning_rate": 1.9807218224634957e-06, "loss": 1.1414, "step": 19240 }, { "epoch": 0.58, "learning_rate": 1.9804832247396428e-06, "loss": 1.0997, "step": 19241 }, { "epoch": 0.58, "learning_rate": 1.9802446319613395e-06, "loss": 1.0663, "step": 19242 }, { "epoch": 0.58, "learning_rate": 1.9800060441308564e-06, "loss": 1.0701, "step": 19243 }, { "epoch": 0.58, "learning_rate": 1.979767461250467e-06, "loss": 1.1888, "step": 19244 }, { "epoch": 0.58, "learning_rate": 1.9795288833224397e-06, "loss": 1.1038, "step": 19245 }, { "epoch": 0.58, "learning_rate": 1.9792903103490467e-06, "loss": 1.0555, "step": 19246 }, { "epoch": 0.58, "learning_rate": 1.979051742332559e-06, "loss": 1.0477, "step": 19247 }, { "epoch": 0.58, "learning_rate": 1.978813179275249e-06, "loss": 1.1994, "step": 19248 }, { "epoch": 0.58, "learning_rate": 1.9785746211793856e-06, "loss": 1.0889, "step": 19249 }, { "epoch": 0.58, "learning_rate": 1.9783360680472405e-06, "loss": 1.1715, "step": 19250 }, { "epoch": 0.58, "learning_rate": 1.9780975198810847e-06, "loss": 1.1231, "step": 19251 }, { "epoch": 0.58, "learning_rate": 1.97785897668319e-06, "loss": 1.1298, "step": 19252 }, { "epoch": 0.58, "learning_rate": 1.9776204384558254e-06, "loss": 1.0608, "step": 19253 }, { "epoch": 0.58, "learning_rate": 1.977381905201263e-06, "loss": 1.0604, "step": 19254 }, { "epoch": 0.58, "learning_rate": 1.977143376921773e-06, "loss": 1.2618, "step": 19255 }, { "epoch": 0.58, "learning_rate": 1.9769048536196264e-06, "loss": 1.1973, "step": 19256 }, { "epoch": 0.58, "learning_rate": 1.9766663352970947e-06, "loss": 1.1677, "step": 19257 }, { "epoch": 0.58, "learning_rate": 1.976427821956446e-06, "loss": 1.2311, "step": 19258 }, { "epoch": 0.58, "learning_rate": 1.9761893135999525e-06, "loss": 1.1167, "step": 19259 }, { "epoch": 0.58, "learning_rate": 1.9759508102298846e-06, "loss": 1.2598, "step": 19260 }, { "epoch": 0.58, "learning_rate": 1.975712311848514e-06, "loss": 1.19, "step": 19261 }, { "epoch": 0.58, "learning_rate": 1.975473818458108e-06, "loss": 1.2242, "step": 19262 }, { "epoch": 0.58, "learning_rate": 1.9752353300609387e-06, "loss": 1.2037, "step": 19263 }, { "epoch": 0.58, "learning_rate": 1.9749968466592766e-06, "loss": 1.1019, "step": 19264 }, { "epoch": 0.58, "learning_rate": 1.974758368255392e-06, "loss": 1.0045, "step": 19265 }, { "epoch": 0.58, "learning_rate": 1.9745198948515543e-06, "loss": 1.1835, "step": 19266 }, { "epoch": 0.58, "learning_rate": 1.974281426450034e-06, "loss": 1.1226, "step": 19267 }, { "epoch": 0.58, "learning_rate": 1.9740429630531015e-06, "loss": 1.169, "step": 19268 }, { "epoch": 0.58, "learning_rate": 1.9738045046630268e-06, "loss": 1.1434, "step": 19269 }, { "epoch": 0.58, "learning_rate": 1.9735660512820804e-06, "loss": 1.0993, "step": 19270 }, { "epoch": 0.58, "learning_rate": 1.973327602912531e-06, "loss": 1.0832, "step": 19271 }, { "epoch": 0.58, "learning_rate": 1.9730891595566493e-06, "loss": 1.156, "step": 19272 }, { "epoch": 0.58, "learning_rate": 1.9728507212167045e-06, "loss": 1.0635, "step": 19273 }, { "epoch": 0.58, "learning_rate": 1.9726122878949684e-06, "loss": 1.1046, "step": 19274 }, { "epoch": 0.58, "learning_rate": 1.972373859593708e-06, "loss": 1.0556, "step": 19275 }, { "epoch": 0.58, "learning_rate": 1.9721354363151944e-06, "loss": 1.1487, "step": 19276 }, { "epoch": 0.58, "learning_rate": 1.9718970180616976e-06, "loss": 1.0269, "step": 19277 }, { "epoch": 0.58, "learning_rate": 1.971658604835487e-06, "loss": 1.1036, "step": 19278 }, { "epoch": 0.58, "learning_rate": 1.9714201966388317e-06, "loss": 1.0652, "step": 19279 }, { "epoch": 0.58, "learning_rate": 1.971181793474001e-06, "loss": 1.1787, "step": 19280 }, { "epoch": 0.58, "learning_rate": 1.9709433953432656e-06, "loss": 1.1769, "step": 19281 }, { "epoch": 0.58, "learning_rate": 1.970705002248894e-06, "loss": 1.1165, "step": 19282 }, { "epoch": 0.58, "learning_rate": 1.970466614193157e-06, "loss": 1.0338, "step": 19283 }, { "epoch": 0.58, "learning_rate": 1.9702282311783214e-06, "loss": 1.0352, "step": 19284 }, { "epoch": 0.58, "learning_rate": 1.9699898532066584e-06, "loss": 1.2336, "step": 19285 }, { "epoch": 0.58, "learning_rate": 1.9697514802804365e-06, "loss": 1.0544, "step": 19286 }, { "epoch": 0.58, "learning_rate": 1.969513112401926e-06, "loss": 1.0859, "step": 19287 }, { "epoch": 0.58, "learning_rate": 1.969274749573395e-06, "loss": 1.1617, "step": 19288 }, { "epoch": 0.58, "learning_rate": 1.969036391797112e-06, "loss": 1.1258, "step": 19289 }, { "epoch": 0.58, "learning_rate": 1.968798039075347e-06, "loss": 1.1371, "step": 19290 }, { "epoch": 0.58, "learning_rate": 1.968559691410369e-06, "loss": 1.2101, "step": 19291 }, { "epoch": 0.58, "learning_rate": 1.968321348804447e-06, "loss": 1.3052, "step": 19292 }, { "epoch": 0.58, "learning_rate": 1.9680830112598487e-06, "loss": 1.1831, "step": 19293 }, { "epoch": 0.58, "learning_rate": 1.967844678778845e-06, "loss": 1.0886, "step": 19294 }, { "epoch": 0.58, "learning_rate": 1.9676063513637035e-06, "loss": 1.0647, "step": 19295 }, { "epoch": 0.58, "learning_rate": 1.9673680290166933e-06, "loss": 1.0784, "step": 19296 }, { "epoch": 0.58, "learning_rate": 1.9671297117400824e-06, "loss": 1.1127, "step": 19297 }, { "epoch": 0.58, "learning_rate": 1.96689139953614e-06, "loss": 1.2389, "step": 19298 }, { "epoch": 0.58, "learning_rate": 1.9666530924071347e-06, "loss": 1.1919, "step": 19299 }, { "epoch": 0.58, "learning_rate": 1.9664147903553363e-06, "loss": 1.0532, "step": 19300 }, { "epoch": 0.58, "learning_rate": 1.966176493383011e-06, "loss": 1.1436, "step": 19301 }, { "epoch": 0.58, "learning_rate": 1.965938201492428e-06, "loss": 1.1013, "step": 19302 }, { "epoch": 0.58, "learning_rate": 1.965699914685857e-06, "loss": 0.8794, "step": 19303 }, { "epoch": 0.58, "learning_rate": 1.9654616329655653e-06, "loss": 1.1348, "step": 19304 }, { "epoch": 0.58, "learning_rate": 1.9652233563338215e-06, "loss": 1.1776, "step": 19305 }, { "epoch": 0.58, "learning_rate": 1.9649850847928935e-06, "loss": 1.2546, "step": 19306 }, { "epoch": 0.58, "learning_rate": 1.9647468183450497e-06, "loss": 1.1332, "step": 19307 }, { "epoch": 0.58, "learning_rate": 1.964508556992559e-06, "loss": 1.1614, "step": 19308 }, { "epoch": 0.58, "learning_rate": 1.964270300737688e-06, "loss": 1.1113, "step": 19309 }, { "epoch": 0.58, "learning_rate": 1.964032049582706e-06, "loss": 1.1308, "step": 19310 }, { "epoch": 0.58, "learning_rate": 1.9637938035298807e-06, "loss": 1.1961, "step": 19311 }, { "epoch": 0.58, "learning_rate": 1.96355556258148e-06, "loss": 1.1263, "step": 19312 }, { "epoch": 0.58, "learning_rate": 1.963317326739774e-06, "loss": 1.1216, "step": 19313 }, { "epoch": 0.58, "learning_rate": 1.9630790960070264e-06, "loss": 1.0757, "step": 19314 }, { "epoch": 0.58, "learning_rate": 1.9628408703855075e-06, "loss": 1.102, "step": 19315 }, { "epoch": 0.58, "learning_rate": 1.962602649877485e-06, "loss": 1.1332, "step": 19316 }, { "epoch": 0.58, "learning_rate": 1.9623644344852275e-06, "loss": 1.0817, "step": 19317 }, { "epoch": 0.58, "learning_rate": 1.9621262242110006e-06, "loss": 1.1143, "step": 19318 }, { "epoch": 0.58, "learning_rate": 1.9618880190570727e-06, "loss": 1.0975, "step": 19319 }, { "epoch": 0.58, "learning_rate": 1.961649819025712e-06, "loss": 1.1751, "step": 19320 }, { "epoch": 0.58, "learning_rate": 1.9614116241191862e-06, "loss": 1.0565, "step": 19321 }, { "epoch": 0.58, "learning_rate": 1.961173434339762e-06, "loss": 1.108, "step": 19322 }, { "epoch": 0.58, "learning_rate": 1.9609352496897067e-06, "loss": 1.0588, "step": 19323 }, { "epoch": 0.58, "learning_rate": 1.9606970701712886e-06, "loss": 1.1664, "step": 19324 }, { "epoch": 0.58, "learning_rate": 1.9604588957867744e-06, "loss": 1.117, "step": 19325 }, { "epoch": 0.58, "learning_rate": 1.9602207265384333e-06, "loss": 1.0696, "step": 19326 }, { "epoch": 0.58, "learning_rate": 1.959982562428529e-06, "loss": 1.1782, "step": 19327 }, { "epoch": 0.58, "learning_rate": 1.9597444034593314e-06, "loss": 1.0157, "step": 19328 }, { "epoch": 0.58, "learning_rate": 1.9595062496331065e-06, "loss": 1.1954, "step": 19329 }, { "epoch": 0.58, "learning_rate": 1.959268100952123e-06, "loss": 1.2408, "step": 19330 }, { "epoch": 0.58, "learning_rate": 1.959029957418645e-06, "loss": 1.1799, "step": 19331 }, { "epoch": 0.58, "learning_rate": 1.958791819034942e-06, "loss": 1.1145, "step": 19332 }, { "epoch": 0.58, "learning_rate": 1.95855368580328e-06, "loss": 1.2191, "step": 19333 }, { "epoch": 0.58, "learning_rate": 1.958315557725927e-06, "loss": 1.058, "step": 19334 }, { "epoch": 0.58, "learning_rate": 1.958077434805148e-06, "loss": 1.1249, "step": 19335 }, { "epoch": 0.58, "learning_rate": 1.9578393170432113e-06, "loss": 1.1053, "step": 19336 }, { "epoch": 0.58, "learning_rate": 1.9576012044423827e-06, "loss": 1.1327, "step": 19337 }, { "epoch": 0.58, "learning_rate": 1.9573630970049297e-06, "loss": 1.1489, "step": 19338 }, { "epoch": 0.58, "learning_rate": 1.95712499473312e-06, "loss": 1.0358, "step": 19339 }, { "epoch": 0.58, "learning_rate": 1.9568868976292172e-06, "loss": 0.9841, "step": 19340 }, { "epoch": 0.58, "learning_rate": 1.95664880569549e-06, "loss": 1.0469, "step": 19341 }, { "epoch": 0.58, "learning_rate": 1.9564107189342042e-06, "loss": 1.1678, "step": 19342 }, { "epoch": 0.58, "learning_rate": 1.956172637347628e-06, "loss": 1.1382, "step": 19343 }, { "epoch": 0.58, "learning_rate": 1.9559345609380252e-06, "loss": 1.0612, "step": 19344 }, { "epoch": 0.58, "learning_rate": 1.955696489707663e-06, "loss": 1.0842, "step": 19345 }, { "epoch": 0.58, "learning_rate": 1.9554584236588085e-06, "loss": 1.1193, "step": 19346 }, { "epoch": 0.58, "learning_rate": 1.9552203627937278e-06, "loss": 1.0198, "step": 19347 }, { "epoch": 0.58, "learning_rate": 1.9549823071146864e-06, "loss": 0.9966, "step": 19348 }, { "epoch": 0.58, "learning_rate": 1.954744256623951e-06, "loss": 1.0408, "step": 19349 }, { "epoch": 0.58, "learning_rate": 1.9545062113237875e-06, "loss": 1.1708, "step": 19350 }, { "epoch": 0.58, "learning_rate": 1.9542681712164626e-06, "loss": 1.1335, "step": 19351 }, { "epoch": 0.58, "learning_rate": 1.9540301363042423e-06, "loss": 1.1194, "step": 19352 }, { "epoch": 0.58, "learning_rate": 1.9537921065893916e-06, "loss": 1.1095, "step": 19353 }, { "epoch": 0.58, "learning_rate": 1.9535540820741767e-06, "loss": 1.1451, "step": 19354 }, { "epoch": 0.58, "learning_rate": 1.953316062760864e-06, "loss": 1.1652, "step": 19355 }, { "epoch": 0.58, "learning_rate": 1.95307804865172e-06, "loss": 1.0046, "step": 19356 }, { "epoch": 0.58, "learning_rate": 1.952840039749008e-06, "loss": 1.0561, "step": 19357 }, { "epoch": 0.58, "learning_rate": 1.9526020360549965e-06, "loss": 1.0651, "step": 19358 }, { "epoch": 0.58, "learning_rate": 1.9523640375719493e-06, "loss": 1.0875, "step": 19359 }, { "epoch": 0.58, "learning_rate": 1.9521260443021328e-06, "loss": 1.2121, "step": 19360 }, { "epoch": 0.58, "learning_rate": 1.951888056247813e-06, "loss": 1.181, "step": 19361 }, { "epoch": 0.58, "learning_rate": 1.951650073411254e-06, "loss": 1.0995, "step": 19362 }, { "epoch": 0.58, "learning_rate": 1.9514120957947223e-06, "loss": 1.1238, "step": 19363 }, { "epoch": 0.58, "learning_rate": 1.9511741234004834e-06, "loss": 1.147, "step": 19364 }, { "epoch": 0.58, "learning_rate": 1.950936156230804e-06, "loss": 1.1674, "step": 19365 }, { "epoch": 0.58, "learning_rate": 1.9506981942879466e-06, "loss": 1.1227, "step": 19366 }, { "epoch": 0.58, "learning_rate": 1.9504602375741777e-06, "loss": 1.2324, "step": 19367 }, { "epoch": 0.58, "learning_rate": 1.9502222860917626e-06, "loss": 1.1616, "step": 19368 }, { "epoch": 0.58, "learning_rate": 1.949984339842968e-06, "loss": 1.0823, "step": 19369 }, { "epoch": 0.58, "learning_rate": 1.9497463988300564e-06, "loss": 1.1657, "step": 19370 }, { "epoch": 0.58, "learning_rate": 1.949508463055294e-06, "loss": 1.0966, "step": 19371 }, { "epoch": 0.58, "learning_rate": 1.9492705325209455e-06, "loss": 1.0773, "step": 19372 }, { "epoch": 0.58, "learning_rate": 1.949032607229277e-06, "loss": 1.1791, "step": 19373 }, { "epoch": 0.58, "learning_rate": 1.9487946871825527e-06, "loss": 1.0186, "step": 19374 }, { "epoch": 0.58, "learning_rate": 1.9485567723830374e-06, "loss": 1.0441, "step": 19375 }, { "epoch": 0.58, "learning_rate": 1.9483188628329964e-06, "loss": 1.1705, "step": 19376 }, { "epoch": 0.58, "learning_rate": 1.9480809585346936e-06, "loss": 1.0703, "step": 19377 }, { "epoch": 0.58, "learning_rate": 1.9478430594903946e-06, "loss": 1.1722, "step": 19378 }, { "epoch": 0.58, "learning_rate": 1.9476051657023633e-06, "loss": 1.0646, "step": 19379 }, { "epoch": 0.58, "learning_rate": 1.947367277172865e-06, "loss": 1.1785, "step": 19380 }, { "epoch": 0.58, "learning_rate": 1.947129393904164e-06, "loss": 1.1119, "step": 19381 }, { "epoch": 0.58, "learning_rate": 1.946891515898526e-06, "loss": 1.0492, "step": 19382 }, { "epoch": 0.58, "learning_rate": 1.946653643158213e-06, "loss": 1.151, "step": 19383 }, { "epoch": 0.58, "learning_rate": 1.946415775685491e-06, "loss": 0.9944, "step": 19384 }, { "epoch": 0.58, "learning_rate": 1.946177913482624e-06, "loss": 1.1252, "step": 19385 }, { "epoch": 0.58, "learning_rate": 1.945940056551878e-06, "loss": 1.0756, "step": 19386 }, { "epoch": 0.58, "learning_rate": 1.945702204895515e-06, "loss": 1.1226, "step": 19387 }, { "epoch": 0.58, "learning_rate": 1.9454643585157994e-06, "loss": 1.1027, "step": 19388 }, { "epoch": 0.58, "learning_rate": 1.945226517414996e-06, "loss": 1.0614, "step": 19389 }, { "epoch": 0.58, "learning_rate": 1.9449886815953696e-06, "loss": 1.1225, "step": 19390 }, { "epoch": 0.58, "learning_rate": 1.9447508510591836e-06, "loss": 1.02, "step": 19391 }, { "epoch": 0.58, "learning_rate": 1.9445130258087016e-06, "loss": 1.0995, "step": 19392 }, { "epoch": 0.58, "learning_rate": 1.9442752058461884e-06, "loss": 1.2045, "step": 19393 }, { "epoch": 0.58, "learning_rate": 1.9440373911739075e-06, "loss": 1.0282, "step": 19394 }, { "epoch": 0.58, "learning_rate": 1.943799581794124e-06, "loss": 1.0911, "step": 19395 }, { "epoch": 0.58, "learning_rate": 1.943561777709099e-06, "loss": 1.1207, "step": 19396 }, { "epoch": 0.58, "learning_rate": 1.9433239789210984e-06, "loss": 1.1873, "step": 19397 }, { "epoch": 0.58, "learning_rate": 1.943086185432385e-06, "loss": 1.0903, "step": 19398 }, { "epoch": 0.58, "learning_rate": 1.9428483972452245e-06, "loss": 1.1037, "step": 19399 }, { "epoch": 0.58, "learning_rate": 1.942610614361878e-06, "loss": 1.2117, "step": 19400 }, { "epoch": 0.58, "learning_rate": 1.942372836784609e-06, "loss": 1.0654, "step": 19401 }, { "epoch": 0.58, "learning_rate": 1.9421350645156827e-06, "loss": 1.0694, "step": 19402 }, { "epoch": 0.58, "learning_rate": 1.9418972975573623e-06, "loss": 1.1401, "step": 19403 }, { "epoch": 0.58, "learning_rate": 1.9416595359119104e-06, "loss": 1.0994, "step": 19404 }, { "epoch": 0.58, "learning_rate": 1.941421779581591e-06, "loss": 1.2101, "step": 19405 }, { "epoch": 0.58, "learning_rate": 1.9411840285686672e-06, "loss": 1.064, "step": 19406 }, { "epoch": 0.58, "learning_rate": 1.940946282875402e-06, "loss": 1.0235, "step": 19407 }, { "epoch": 0.58, "learning_rate": 1.94070854250406e-06, "loss": 1.0699, "step": 19408 }, { "epoch": 0.58, "learning_rate": 1.9404708074569027e-06, "loss": 1.0285, "step": 19409 }, { "epoch": 0.58, "learning_rate": 1.9402330777361937e-06, "loss": 1.1993, "step": 19410 }, { "epoch": 0.58, "learning_rate": 1.939995353344196e-06, "loss": 1.2581, "step": 19411 }, { "epoch": 0.58, "learning_rate": 1.939757634283174e-06, "loss": 1.1209, "step": 19412 }, { "epoch": 0.58, "learning_rate": 1.939519920555388e-06, "loss": 1.0943, "step": 19413 }, { "epoch": 0.58, "learning_rate": 1.939282212163103e-06, "loss": 1.2084, "step": 19414 }, { "epoch": 0.58, "learning_rate": 1.939044509108581e-06, "loss": 1.1085, "step": 19415 }, { "epoch": 0.58, "learning_rate": 1.9388068113940853e-06, "loss": 1.2152, "step": 19416 }, { "epoch": 0.58, "learning_rate": 1.9385691190218787e-06, "loss": 1.2124, "step": 19417 }, { "epoch": 0.58, "learning_rate": 1.938331431994224e-06, "loss": 1.2096, "step": 19418 }, { "epoch": 0.58, "learning_rate": 1.9380937503133824e-06, "loss": 1.086, "step": 19419 }, { "epoch": 0.59, "learning_rate": 1.9378560739816183e-06, "loss": 1.1349, "step": 19420 }, { "epoch": 0.59, "learning_rate": 1.9376184030011946e-06, "loss": 1.1152, "step": 19421 }, { "epoch": 0.59, "learning_rate": 1.937380737374372e-06, "loss": 1.1265, "step": 19422 }, { "epoch": 0.59, "learning_rate": 1.9371430771034133e-06, "loss": 0.9897, "step": 19423 }, { "epoch": 0.59, "learning_rate": 1.9369054221905816e-06, "loss": 1.22, "step": 19424 }, { "epoch": 0.59, "learning_rate": 1.9366677726381407e-06, "loss": 1.2001, "step": 19425 }, { "epoch": 0.59, "learning_rate": 1.9364301284483496e-06, "loss": 1.0883, "step": 19426 }, { "epoch": 0.59, "learning_rate": 1.9361924896234725e-06, "loss": 1.0895, "step": 19427 }, { "epoch": 0.59, "learning_rate": 1.935954856165771e-06, "loss": 1.0663, "step": 19428 }, { "epoch": 0.59, "learning_rate": 1.9357172280775084e-06, "loss": 1.1019, "step": 19429 }, { "epoch": 0.59, "learning_rate": 1.935479605360946e-06, "loss": 1.0463, "step": 19430 }, { "epoch": 0.59, "learning_rate": 1.9352419880183454e-06, "loss": 1.0972, "step": 19431 }, { "epoch": 0.59, "learning_rate": 1.935004376051969e-06, "loss": 1.1522, "step": 19432 }, { "epoch": 0.59, "learning_rate": 1.934766769464079e-06, "loss": 1.1053, "step": 19433 }, { "epoch": 0.59, "learning_rate": 1.934529168256938e-06, "loss": 1.1092, "step": 19434 }, { "epoch": 0.59, "learning_rate": 1.934291572432806e-06, "loss": 1.1727, "step": 19435 }, { "epoch": 0.59, "learning_rate": 1.934053981993946e-06, "loss": 1.1478, "step": 19436 }, { "epoch": 0.59, "learning_rate": 1.9338163969426195e-06, "loss": 1.149, "step": 19437 }, { "epoch": 0.59, "learning_rate": 1.933578817281089e-06, "loss": 1.1171, "step": 19438 }, { "epoch": 0.59, "learning_rate": 1.9333412430116145e-06, "loss": 1.0701, "step": 19439 }, { "epoch": 0.59, "learning_rate": 1.933103674136458e-06, "loss": 1.131, "step": 19440 }, { "epoch": 0.59, "learning_rate": 1.932866110657882e-06, "loss": 1.028, "step": 19441 }, { "epoch": 0.59, "learning_rate": 1.9326285525781476e-06, "loss": 1.2433, "step": 19442 }, { "epoch": 0.59, "learning_rate": 1.932390999899516e-06, "loss": 1.1921, "step": 19443 }, { "epoch": 0.59, "learning_rate": 1.932153452624249e-06, "loss": 1.1575, "step": 19444 }, { "epoch": 0.59, "learning_rate": 1.9319159107546072e-06, "loss": 1.0956, "step": 19445 }, { "epoch": 0.59, "learning_rate": 1.931678374292852e-06, "loss": 1.0804, "step": 19446 }, { "epoch": 0.59, "learning_rate": 1.9314408432412467e-06, "loss": 1.0624, "step": 19447 }, { "epoch": 0.59, "learning_rate": 1.9312033176020493e-06, "loss": 1.0521, "step": 19448 }, { "epoch": 0.59, "learning_rate": 1.9309657973775227e-06, "loss": 1.0797, "step": 19449 }, { "epoch": 0.59, "learning_rate": 1.930728282569927e-06, "loss": 1.0403, "step": 19450 }, { "epoch": 0.59, "learning_rate": 1.9304907731815254e-06, "loss": 1.0902, "step": 19451 }, { "epoch": 0.59, "learning_rate": 1.9302532692145765e-06, "loss": 1.12, "step": 19452 }, { "epoch": 0.59, "learning_rate": 1.9300157706713413e-06, "loss": 1.0583, "step": 19453 }, { "epoch": 0.59, "learning_rate": 1.929778277554082e-06, "loss": 1.0887, "step": 19454 }, { "epoch": 0.59, "learning_rate": 1.929540789865059e-06, "loss": 1.2184, "step": 19455 }, { "epoch": 0.59, "learning_rate": 1.9293033076065333e-06, "loss": 1.1268, "step": 19456 }, { "epoch": 0.59, "learning_rate": 1.9290658307807647e-06, "loss": 1.0297, "step": 19457 }, { "epoch": 0.59, "learning_rate": 1.928828359390015e-06, "loss": 1.1759, "step": 19458 }, { "epoch": 0.59, "learning_rate": 1.9285908934365438e-06, "loss": 1.0739, "step": 19459 }, { "epoch": 0.59, "learning_rate": 1.9283534329226125e-06, "loss": 1.176, "step": 19460 }, { "epoch": 0.59, "learning_rate": 1.928115977850481e-06, "loss": 1.0763, "step": 19461 }, { "epoch": 0.59, "learning_rate": 1.9278785282224095e-06, "loss": 1.1221, "step": 19462 }, { "epoch": 0.59, "learning_rate": 1.9276410840406588e-06, "loss": 1.1148, "step": 19463 }, { "epoch": 0.59, "learning_rate": 1.9274036453074907e-06, "loss": 1.1338, "step": 19464 }, { "epoch": 0.59, "learning_rate": 1.9271662120251626e-06, "loss": 1.1613, "step": 19465 }, { "epoch": 0.59, "learning_rate": 1.926928784195937e-06, "loss": 1.1156, "step": 19466 }, { "epoch": 0.59, "learning_rate": 1.926691361822073e-06, "loss": 1.1911, "step": 19467 }, { "epoch": 0.59, "learning_rate": 1.926453944905831e-06, "loss": 1.0789, "step": 19468 }, { "epoch": 0.59, "learning_rate": 1.926216533449472e-06, "loss": 1.1276, "step": 19469 }, { "epoch": 0.59, "learning_rate": 1.925979127455255e-06, "loss": 1.16, "step": 19470 }, { "epoch": 0.59, "learning_rate": 1.92574172692544e-06, "loss": 1.0975, "step": 19471 }, { "epoch": 0.59, "learning_rate": 1.925504331862287e-06, "loss": 1.1039, "step": 19472 }, { "epoch": 0.59, "learning_rate": 1.9252669422680564e-06, "loss": 1.1357, "step": 19473 }, { "epoch": 0.59, "learning_rate": 1.9250295581450074e-06, "loss": 1.1818, "step": 19474 }, { "epoch": 0.59, "learning_rate": 1.9247921794954002e-06, "loss": 1.0478, "step": 19475 }, { "epoch": 0.59, "learning_rate": 1.9245548063214942e-06, "loss": 1.1276, "step": 19476 }, { "epoch": 0.59, "learning_rate": 1.9243174386255507e-06, "loss": 1.1091, "step": 19477 }, { "epoch": 0.59, "learning_rate": 1.924080076409827e-06, "loss": 1.1063, "step": 19478 }, { "epoch": 0.59, "learning_rate": 1.923842719676583e-06, "loss": 1.0637, "step": 19479 }, { "epoch": 0.59, "learning_rate": 1.923605368428079e-06, "loss": 1.2628, "step": 19480 }, { "epoch": 0.59, "learning_rate": 1.923368022666574e-06, "loss": 1.1531, "step": 19481 }, { "epoch": 0.59, "learning_rate": 1.9231306823943294e-06, "loss": 1.151, "step": 19482 }, { "epoch": 0.59, "learning_rate": 1.9228933476136016e-06, "loss": 1.016, "step": 19483 }, { "epoch": 0.59, "learning_rate": 1.9226560183266508e-06, "loss": 1.0822, "step": 19484 }, { "epoch": 0.59, "learning_rate": 1.922418694535737e-06, "loss": 1.0596, "step": 19485 }, { "epoch": 0.59, "learning_rate": 1.92218137624312e-06, "loss": 1.1138, "step": 19486 }, { "epoch": 0.59, "learning_rate": 1.921944063451057e-06, "loss": 1.0381, "step": 19487 }, { "epoch": 0.59, "learning_rate": 1.921706756161808e-06, "loss": 1.0209, "step": 19488 }, { "epoch": 0.59, "learning_rate": 1.9214694543776324e-06, "loss": 1.0668, "step": 19489 }, { "epoch": 0.59, "learning_rate": 1.92123215810079e-06, "loss": 1.0333, "step": 19490 }, { "epoch": 0.59, "learning_rate": 1.920994867333538e-06, "loss": 1.1154, "step": 19491 }, { "epoch": 0.59, "learning_rate": 1.9207575820781354e-06, "loss": 1.2516, "step": 19492 }, { "epoch": 0.59, "learning_rate": 1.9205203023368415e-06, "loss": 1.1055, "step": 19493 }, { "epoch": 0.59, "learning_rate": 1.9202830281119167e-06, "loss": 1.1693, "step": 19494 }, { "epoch": 0.59, "learning_rate": 1.9200457594056173e-06, "loss": 1.163, "step": 19495 }, { "epoch": 0.59, "learning_rate": 1.9198084962202024e-06, "loss": 1.0671, "step": 19496 }, { "epoch": 0.59, "learning_rate": 1.919571238557932e-06, "loss": 1.1421, "step": 19497 }, { "epoch": 0.59, "learning_rate": 1.9193339864210633e-06, "loss": 1.1527, "step": 19498 }, { "epoch": 0.59, "learning_rate": 1.919096739811856e-06, "loss": 1.0843, "step": 19499 }, { "epoch": 0.59, "learning_rate": 1.9188594987325677e-06, "loss": 0.9818, "step": 19500 }, { "epoch": 0.59, "learning_rate": 1.918622263185457e-06, "loss": 1.1691, "step": 19501 }, { "epoch": 0.59, "learning_rate": 1.918385033172782e-06, "loss": 1.1395, "step": 19502 }, { "epoch": 0.59, "learning_rate": 1.918147808696803e-06, "loss": 1.1139, "step": 19503 }, { "epoch": 0.59, "learning_rate": 1.917910589759775e-06, "loss": 1.1429, "step": 19504 }, { "epoch": 0.59, "learning_rate": 1.917673376363958e-06, "loss": 1.1854, "step": 19505 }, { "epoch": 0.59, "learning_rate": 1.9174361685116104e-06, "loss": 1.1767, "step": 19506 }, { "epoch": 0.59, "learning_rate": 1.9171989662049908e-06, "loss": 1.1887, "step": 19507 }, { "epoch": 0.59, "learning_rate": 1.9169617694463548e-06, "loss": 1.1282, "step": 19508 }, { "epoch": 0.59, "learning_rate": 1.9167245782379627e-06, "loss": 0.9849, "step": 19509 }, { "epoch": 0.59, "learning_rate": 1.916487392582071e-06, "loss": 1.0698, "step": 19510 }, { "epoch": 0.59, "learning_rate": 1.9162502124809385e-06, "loss": 1.1589, "step": 19511 }, { "epoch": 0.59, "learning_rate": 1.9160130379368236e-06, "loss": 1.1102, "step": 19512 }, { "epoch": 0.59, "learning_rate": 1.915775868951983e-06, "loss": 1.0853, "step": 19513 }, { "epoch": 0.59, "learning_rate": 1.915538705528674e-06, "loss": 1.09, "step": 19514 }, { "epoch": 0.59, "learning_rate": 1.9153015476691555e-06, "loss": 1.0322, "step": 19515 }, { "epoch": 0.59, "learning_rate": 1.915064395375686e-06, "loss": 1.1738, "step": 19516 }, { "epoch": 0.59, "learning_rate": 1.91482724865052e-06, "loss": 1.0005, "step": 19517 }, { "epoch": 0.59, "learning_rate": 1.914590107495917e-06, "loss": 1.1238, "step": 19518 }, { "epoch": 0.59, "learning_rate": 1.9143529719141345e-06, "loss": 0.9287, "step": 19519 }, { "epoch": 0.59, "learning_rate": 1.914115841907431e-06, "loss": 1.0921, "step": 19520 }, { "epoch": 0.59, "learning_rate": 1.9138787174780605e-06, "loss": 1.0507, "step": 19521 }, { "epoch": 0.59, "learning_rate": 1.913641598628283e-06, "loss": 1.0956, "step": 19522 }, { "epoch": 0.59, "learning_rate": 1.913404485360355e-06, "loss": 1.046, "step": 19523 }, { "epoch": 0.59, "learning_rate": 1.9131673776765336e-06, "loss": 1.0999, "step": 19524 }, { "epoch": 0.59, "learning_rate": 1.9129302755790768e-06, "loss": 1.2418, "step": 19525 }, { "epoch": 0.59, "learning_rate": 1.912693179070241e-06, "loss": 1.1252, "step": 19526 }, { "epoch": 0.59, "learning_rate": 1.9124560881522824e-06, "loss": 1.1604, "step": 19527 }, { "epoch": 0.59, "learning_rate": 1.912219002827459e-06, "loss": 1.0048, "step": 19528 }, { "epoch": 0.59, "learning_rate": 1.911981923098029e-06, "loss": 1.1653, "step": 19529 }, { "epoch": 0.59, "learning_rate": 1.911744848966247e-06, "loss": 1.2767, "step": 19530 }, { "epoch": 0.59, "learning_rate": 1.9115077804343704e-06, "loss": 1.1478, "step": 19531 }, { "epoch": 0.59, "learning_rate": 1.9112707175046565e-06, "loss": 1.2031, "step": 19532 }, { "epoch": 0.59, "learning_rate": 1.9110336601793623e-06, "loss": 1.1711, "step": 19533 }, { "epoch": 0.59, "learning_rate": 1.910796608460744e-06, "loss": 1.1489, "step": 19534 }, { "epoch": 0.59, "learning_rate": 1.910559562351057e-06, "loss": 1.1149, "step": 19535 }, { "epoch": 0.59, "learning_rate": 1.9103225218525603e-06, "loss": 1.1853, "step": 19536 }, { "epoch": 0.59, "learning_rate": 1.910085486967508e-06, "loss": 1.1362, "step": 19537 }, { "epoch": 0.59, "learning_rate": 1.909848457698159e-06, "loss": 1.0706, "step": 19538 }, { "epoch": 0.59, "learning_rate": 1.9096114340467677e-06, "loss": 1.1063, "step": 19539 }, { "epoch": 0.59, "learning_rate": 1.909374416015591e-06, "loss": 1.1086, "step": 19540 }, { "epoch": 0.59, "learning_rate": 1.9091374036068867e-06, "loss": 0.9355, "step": 19541 }, { "epoch": 0.59, "learning_rate": 1.9089003968229092e-06, "loss": 1.0189, "step": 19542 }, { "epoch": 0.59, "learning_rate": 1.9086633956659148e-06, "loss": 1.3491, "step": 19543 }, { "epoch": 0.59, "learning_rate": 1.90842640013816e-06, "loss": 1.1982, "step": 19544 }, { "epoch": 0.59, "learning_rate": 1.908189410241901e-06, "loss": 1.1589, "step": 19545 }, { "epoch": 0.59, "learning_rate": 1.907952425979395e-06, "loss": 1.1916, "step": 19546 }, { "epoch": 0.59, "learning_rate": 1.9077154473528957e-06, "loss": 1.0587, "step": 19547 }, { "epoch": 0.59, "learning_rate": 1.90747847436466e-06, "loss": 1.0228, "step": 19548 }, { "epoch": 0.59, "learning_rate": 1.9072415070169437e-06, "loss": 1.1448, "step": 19549 }, { "epoch": 0.59, "learning_rate": 1.9070045453120029e-06, "loss": 1.1053, "step": 19550 }, { "epoch": 0.59, "learning_rate": 1.9067675892520937e-06, "loss": 1.1589, "step": 19551 }, { "epoch": 0.59, "learning_rate": 1.9065306388394713e-06, "loss": 1.0807, "step": 19552 }, { "epoch": 0.59, "learning_rate": 1.906293694076391e-06, "loss": 1.0323, "step": 19553 }, { "epoch": 0.59, "learning_rate": 1.9060567549651088e-06, "loss": 1.1472, "step": 19554 }, { "epoch": 0.59, "learning_rate": 1.9058198215078808e-06, "loss": 1.1555, "step": 19555 }, { "epoch": 0.59, "learning_rate": 1.9055828937069611e-06, "loss": 1.0985, "step": 19556 }, { "epoch": 0.59, "learning_rate": 1.9053459715646063e-06, "loss": 1.0642, "step": 19557 }, { "epoch": 0.59, "learning_rate": 1.9051090550830714e-06, "loss": 1.2386, "step": 19558 }, { "epoch": 0.59, "learning_rate": 1.9048721442646128e-06, "loss": 1.1193, "step": 19559 }, { "epoch": 0.59, "learning_rate": 1.9046352391114837e-06, "loss": 1.0595, "step": 19560 }, { "epoch": 0.59, "learning_rate": 1.9043983396259401e-06, "loss": 1.0552, "step": 19561 }, { "epoch": 0.59, "learning_rate": 1.9041614458102382e-06, "loss": 1.1922, "step": 19562 }, { "epoch": 0.59, "learning_rate": 1.9039245576666316e-06, "loss": 1.1762, "step": 19563 }, { "epoch": 0.59, "learning_rate": 1.9036876751973777e-06, "loss": 1.1094, "step": 19564 }, { "epoch": 0.59, "learning_rate": 1.9034507984047285e-06, "loss": 1.1566, "step": 19565 }, { "epoch": 0.59, "learning_rate": 1.9032139272909406e-06, "loss": 1.1206, "step": 19566 }, { "epoch": 0.59, "learning_rate": 1.9029770618582688e-06, "loss": 1.1199, "step": 19567 }, { "epoch": 0.59, "learning_rate": 1.902740202108968e-06, "loss": 1.0403, "step": 19568 }, { "epoch": 0.59, "learning_rate": 1.9025033480452926e-06, "loss": 1.1435, "step": 19569 }, { "epoch": 0.59, "learning_rate": 1.9022664996694975e-06, "loss": 1.2067, "step": 19570 }, { "epoch": 0.59, "learning_rate": 1.9020296569838376e-06, "loss": 1.1287, "step": 19571 }, { "epoch": 0.59, "learning_rate": 1.901792819990568e-06, "loss": 1.07, "step": 19572 }, { "epoch": 0.59, "learning_rate": 1.9015559886919418e-06, "loss": 1.0702, "step": 19573 }, { "epoch": 0.59, "learning_rate": 1.9013191630902144e-06, "loss": 1.244, "step": 19574 }, { "epoch": 0.59, "learning_rate": 1.9010823431876404e-06, "loss": 1.172, "step": 19575 }, { "epoch": 0.59, "learning_rate": 1.900845528986474e-06, "loss": 1.1443, "step": 19576 }, { "epoch": 0.59, "learning_rate": 1.9006087204889707e-06, "loss": 1.0334, "step": 19577 }, { "epoch": 0.59, "learning_rate": 1.9003719176973823e-06, "loss": 1.205, "step": 19578 }, { "epoch": 0.59, "learning_rate": 1.9001351206139646e-06, "loss": 1.0964, "step": 19579 }, { "epoch": 0.59, "learning_rate": 1.8998983292409718e-06, "loss": 1.1272, "step": 19580 }, { "epoch": 0.59, "learning_rate": 1.8996615435806582e-06, "loss": 1.0954, "step": 19581 }, { "epoch": 0.59, "learning_rate": 1.8994247636352772e-06, "loss": 1.0305, "step": 19582 }, { "epoch": 0.59, "learning_rate": 1.899187989407083e-06, "loss": 1.074, "step": 19583 }, { "epoch": 0.59, "learning_rate": 1.8989512208983301e-06, "loss": 1.046, "step": 19584 }, { "epoch": 0.59, "learning_rate": 1.8987144581112729e-06, "loss": 1.098, "step": 19585 }, { "epoch": 0.59, "learning_rate": 1.8984777010481636e-06, "loss": 1.0649, "step": 19586 }, { "epoch": 0.59, "learning_rate": 1.898240949711257e-06, "loss": 1.293, "step": 19587 }, { "epoch": 0.59, "learning_rate": 1.8980042041028064e-06, "loss": 0.9854, "step": 19588 }, { "epoch": 0.59, "learning_rate": 1.897767464225066e-06, "loss": 1.1302, "step": 19589 }, { "epoch": 0.59, "learning_rate": 1.8975307300802904e-06, "loss": 1.1688, "step": 19590 }, { "epoch": 0.59, "learning_rate": 1.8972940016707308e-06, "loss": 1.041, "step": 19591 }, { "epoch": 0.59, "learning_rate": 1.8970572789986422e-06, "loss": 1.1931, "step": 19592 }, { "epoch": 0.59, "learning_rate": 1.8968205620662778e-06, "loss": 1.0576, "step": 19593 }, { "epoch": 0.59, "learning_rate": 1.8965838508758918e-06, "loss": 1.0627, "step": 19594 }, { "epoch": 0.59, "learning_rate": 1.8963471454297366e-06, "loss": 1.0937, "step": 19595 }, { "epoch": 0.59, "learning_rate": 1.8961104457300656e-06, "loss": 1.0662, "step": 19596 }, { "epoch": 0.59, "learning_rate": 1.8958737517791323e-06, "loss": 1.0819, "step": 19597 }, { "epoch": 0.59, "learning_rate": 1.895637063579191e-06, "loss": 1.1344, "step": 19598 }, { "epoch": 0.59, "learning_rate": 1.8954003811324928e-06, "loss": 1.035, "step": 19599 }, { "epoch": 0.59, "learning_rate": 1.8951637044412918e-06, "loss": 1.1394, "step": 19600 }, { "epoch": 0.59, "learning_rate": 1.894927033507841e-06, "loss": 1.1358, "step": 19601 }, { "epoch": 0.59, "learning_rate": 1.8946903683343932e-06, "loss": 1.132, "step": 19602 }, { "epoch": 0.59, "learning_rate": 1.8944537089232028e-06, "loss": 1.0488, "step": 19603 }, { "epoch": 0.59, "learning_rate": 1.8942170552765204e-06, "loss": 1.1215, "step": 19604 }, { "epoch": 0.59, "learning_rate": 1.8939804073966e-06, "loss": 1.1038, "step": 19605 }, { "epoch": 0.59, "learning_rate": 1.893743765285694e-06, "loss": 0.9781, "step": 19606 }, { "epoch": 0.59, "learning_rate": 1.8935071289460564e-06, "loss": 1.0654, "step": 19607 }, { "epoch": 0.59, "learning_rate": 1.8932704983799378e-06, "loss": 1.0643, "step": 19608 }, { "epoch": 0.59, "learning_rate": 1.893033873589592e-06, "loss": 1.0832, "step": 19609 }, { "epoch": 0.59, "learning_rate": 1.8927972545772713e-06, "loss": 0.9361, "step": 19610 }, { "epoch": 0.59, "learning_rate": 1.8925606413452296e-06, "loss": 1.252, "step": 19611 }, { "epoch": 0.59, "learning_rate": 1.892324033895717e-06, "loss": 1.0685, "step": 19612 }, { "epoch": 0.59, "learning_rate": 1.8920874322309865e-06, "loss": 1.233, "step": 19613 }, { "epoch": 0.59, "learning_rate": 1.891850836353291e-06, "loss": 1.081, "step": 19614 }, { "epoch": 0.59, "learning_rate": 1.891614246264883e-06, "loss": 1.0978, "step": 19615 }, { "epoch": 0.59, "learning_rate": 1.8913776619680153e-06, "loss": 1.0942, "step": 19616 }, { "epoch": 0.59, "learning_rate": 1.891141083464938e-06, "loss": 1.0969, "step": 19617 }, { "epoch": 0.59, "learning_rate": 1.8909045107579044e-06, "loss": 1.2337, "step": 19618 }, { "epoch": 0.59, "learning_rate": 1.8906679438491662e-06, "loss": 1.2331, "step": 19619 }, { "epoch": 0.59, "learning_rate": 1.8904313827409764e-06, "loss": 1.1312, "step": 19620 }, { "epoch": 0.59, "learning_rate": 1.8901948274355857e-06, "loss": 1.1419, "step": 19621 }, { "epoch": 0.59, "learning_rate": 1.8899582779352468e-06, "loss": 1.1601, "step": 19622 }, { "epoch": 0.59, "learning_rate": 1.889721734242212e-06, "loss": 1.1049, "step": 19623 }, { "epoch": 0.59, "learning_rate": 1.8894851963587317e-06, "loss": 1.2327, "step": 19624 }, { "epoch": 0.59, "learning_rate": 1.8892486642870584e-06, "loss": 1.2535, "step": 19625 }, { "epoch": 0.59, "learning_rate": 1.8890121380294433e-06, "loss": 1.0549, "step": 19626 }, { "epoch": 0.59, "learning_rate": 1.8887756175881384e-06, "loss": 1.1262, "step": 19627 }, { "epoch": 0.59, "learning_rate": 1.8885391029653954e-06, "loss": 1.1169, "step": 19628 }, { "epoch": 0.59, "learning_rate": 1.8883025941634664e-06, "loss": 1.0634, "step": 19629 }, { "epoch": 0.59, "learning_rate": 1.8880660911846014e-06, "loss": 1.0013, "step": 19630 }, { "epoch": 0.59, "learning_rate": 1.8878295940310524e-06, "loss": 1.1596, "step": 19631 }, { "epoch": 0.59, "learning_rate": 1.8875931027050705e-06, "loss": 1.1145, "step": 19632 }, { "epoch": 0.59, "learning_rate": 1.8873566172089084e-06, "loss": 1.0744, "step": 19633 }, { "epoch": 0.59, "learning_rate": 1.8871201375448158e-06, "loss": 1.0867, "step": 19634 }, { "epoch": 0.59, "learning_rate": 1.8868836637150438e-06, "loss": 1.1445, "step": 19635 }, { "epoch": 0.59, "learning_rate": 1.8866471957218447e-06, "loss": 1.1194, "step": 19636 }, { "epoch": 0.59, "learning_rate": 1.8864107335674686e-06, "loss": 1.0845, "step": 19637 }, { "epoch": 0.59, "learning_rate": 1.8861742772541666e-06, "loss": 1.0851, "step": 19638 }, { "epoch": 0.59, "learning_rate": 1.8859378267841899e-06, "loss": 1.0481, "step": 19639 }, { "epoch": 0.59, "learning_rate": 1.8857013821597895e-06, "loss": 1.0588, "step": 19640 }, { "epoch": 0.59, "learning_rate": 1.8854649433832157e-06, "loss": 1.0801, "step": 19641 }, { "epoch": 0.59, "learning_rate": 1.8852285104567208e-06, "loss": 0.9926, "step": 19642 }, { "epoch": 0.59, "learning_rate": 1.8849920833825537e-06, "loss": 1.187, "step": 19643 }, { "epoch": 0.59, "learning_rate": 1.8847556621629654e-06, "loss": 1.1401, "step": 19644 }, { "epoch": 0.59, "learning_rate": 1.8845192468002071e-06, "loss": 1.2614, "step": 19645 }, { "epoch": 0.59, "learning_rate": 1.88428283729653e-06, "loss": 1.0724, "step": 19646 }, { "epoch": 0.59, "learning_rate": 1.8840464336541827e-06, "loss": 1.0887, "step": 19647 }, { "epoch": 0.59, "learning_rate": 1.883810035875417e-06, "loss": 1.054, "step": 19648 }, { "epoch": 0.59, "learning_rate": 1.8835736439624827e-06, "loss": 1.1656, "step": 19649 }, { "epoch": 0.59, "learning_rate": 1.883337257917631e-06, "loss": 1.1022, "step": 19650 }, { "epoch": 0.59, "learning_rate": 1.8831008777431112e-06, "loss": 1.2168, "step": 19651 }, { "epoch": 0.59, "learning_rate": 1.8828645034411738e-06, "loss": 1.1313, "step": 19652 }, { "epoch": 0.59, "learning_rate": 1.882628135014069e-06, "loss": 1.1539, "step": 19653 }, { "epoch": 0.59, "learning_rate": 1.8823917724640472e-06, "loss": 1.1874, "step": 19654 }, { "epoch": 0.59, "learning_rate": 1.8821554157933593e-06, "loss": 1.1442, "step": 19655 }, { "epoch": 0.59, "learning_rate": 1.8819190650042535e-06, "loss": 1.2347, "step": 19656 }, { "epoch": 0.59, "learning_rate": 1.8816827200989802e-06, "loss": 1.0172, "step": 19657 }, { "epoch": 0.59, "learning_rate": 1.8814463810797896e-06, "loss": 1.1323, "step": 19658 }, { "epoch": 0.59, "learning_rate": 1.8812100479489325e-06, "loss": 1.0709, "step": 19659 }, { "epoch": 0.59, "learning_rate": 1.880973720708657e-06, "loss": 1.146, "step": 19660 }, { "epoch": 0.59, "learning_rate": 1.8807373993612133e-06, "loss": 1.0819, "step": 19661 }, { "epoch": 0.59, "learning_rate": 1.8805010839088516e-06, "loss": 1.0202, "step": 19662 }, { "epoch": 0.59, "learning_rate": 1.8802647743538217e-06, "loss": 1.1405, "step": 19663 }, { "epoch": 0.59, "learning_rate": 1.8800284706983718e-06, "loss": 0.9635, "step": 19664 }, { "epoch": 0.59, "learning_rate": 1.8797921729447523e-06, "loss": 1.1586, "step": 19665 }, { "epoch": 0.59, "learning_rate": 1.879555881095213e-06, "loss": 1.1243, "step": 19666 }, { "epoch": 0.59, "learning_rate": 1.8793195951520026e-06, "loss": 1.085, "step": 19667 }, { "epoch": 0.59, "learning_rate": 1.8790833151173717e-06, "loss": 1.0505, "step": 19668 }, { "epoch": 0.59, "learning_rate": 1.8788470409935678e-06, "loss": 1.0986, "step": 19669 }, { "epoch": 0.59, "learning_rate": 1.8786107727828406e-06, "loss": 1.1491, "step": 19670 }, { "epoch": 0.59, "learning_rate": 1.8783745104874399e-06, "loss": 0.9993, "step": 19671 }, { "epoch": 0.59, "learning_rate": 1.8781382541096155e-06, "loss": 1.2036, "step": 19672 }, { "epoch": 0.59, "learning_rate": 1.8779020036516144e-06, "loss": 1.0214, "step": 19673 }, { "epoch": 0.59, "learning_rate": 1.8776657591156863e-06, "loss": 1.2056, "step": 19674 }, { "epoch": 0.59, "learning_rate": 1.8774295205040807e-06, "loss": 1.1766, "step": 19675 }, { "epoch": 0.59, "learning_rate": 1.8771932878190467e-06, "loss": 1.1346, "step": 19676 }, { "epoch": 0.59, "learning_rate": 1.876957061062832e-06, "loss": 1.0403, "step": 19677 }, { "epoch": 0.59, "learning_rate": 1.876720840237686e-06, "loss": 1.1088, "step": 19678 }, { "epoch": 0.59, "learning_rate": 1.8764846253458577e-06, "loss": 1.0572, "step": 19679 }, { "epoch": 0.59, "learning_rate": 1.8762484163895964e-06, "loss": 1.2189, "step": 19680 }, { "epoch": 0.59, "learning_rate": 1.8760122133711487e-06, "loss": 1.1682, "step": 19681 }, { "epoch": 0.59, "learning_rate": 1.8757760162927642e-06, "loss": 1.1721, "step": 19682 }, { "epoch": 0.59, "learning_rate": 1.8755398251566912e-06, "loss": 1.1529, "step": 19683 }, { "epoch": 0.59, "learning_rate": 1.8753036399651786e-06, "loss": 1.0263, "step": 19684 }, { "epoch": 0.59, "learning_rate": 1.8750674607204752e-06, "loss": 1.1675, "step": 19685 }, { "epoch": 0.59, "learning_rate": 1.8748312874248278e-06, "loss": 1.2009, "step": 19686 }, { "epoch": 0.59, "learning_rate": 1.8745951200804854e-06, "loss": 1.0191, "step": 19687 }, { "epoch": 0.59, "learning_rate": 1.8743589586896966e-06, "loss": 1.1996, "step": 19688 }, { "epoch": 0.59, "learning_rate": 1.8741228032547094e-06, "loss": 1.2251, "step": 19689 }, { "epoch": 0.59, "learning_rate": 1.8738866537777708e-06, "loss": 1.2396, "step": 19690 }, { "epoch": 0.59, "learning_rate": 1.8736505102611303e-06, "loss": 1.0828, "step": 19691 }, { "epoch": 0.59, "learning_rate": 1.8734143727070347e-06, "loss": 1.1356, "step": 19692 }, { "epoch": 0.59, "learning_rate": 1.873178241117734e-06, "loss": 1.0476, "step": 19693 }, { "epoch": 0.59, "learning_rate": 1.8729421154954735e-06, "loss": 1.0907, "step": 19694 }, { "epoch": 0.59, "learning_rate": 1.872705995842502e-06, "loss": 1.0605, "step": 19695 }, { "epoch": 0.59, "learning_rate": 1.872469882161067e-06, "loss": 1.1309, "step": 19696 }, { "epoch": 0.59, "learning_rate": 1.872233774453417e-06, "loss": 1.1427, "step": 19697 }, { "epoch": 0.59, "learning_rate": 1.8719976727217998e-06, "loss": 1.1412, "step": 19698 }, { "epoch": 0.59, "learning_rate": 1.8717615769684612e-06, "loss": 1.0518, "step": 19699 }, { "epoch": 0.59, "learning_rate": 1.87152548719565e-06, "loss": 1.2158, "step": 19700 }, { "epoch": 0.59, "learning_rate": 1.8712894034056133e-06, "loss": 1.0834, "step": 19701 }, { "epoch": 0.59, "learning_rate": 1.8710533256005997e-06, "loss": 1.1354, "step": 19702 }, { "epoch": 0.59, "learning_rate": 1.8708172537828545e-06, "loss": 1.0323, "step": 19703 }, { "epoch": 0.59, "learning_rate": 1.8705811879546262e-06, "loss": 1.0236, "step": 19704 }, { "epoch": 0.59, "learning_rate": 1.8703451281181623e-06, "loss": 1.1035, "step": 19705 }, { "epoch": 0.59, "learning_rate": 1.8701090742757096e-06, "loss": 1.0228, "step": 19706 }, { "epoch": 0.59, "learning_rate": 1.8698730264295146e-06, "loss": 1.0524, "step": 19707 }, { "epoch": 0.59, "learning_rate": 1.8696369845818252e-06, "loss": 1.1464, "step": 19708 }, { "epoch": 0.59, "learning_rate": 1.8694009487348878e-06, "loss": 1.1681, "step": 19709 }, { "epoch": 0.59, "learning_rate": 1.8691649188909493e-06, "loss": 1.1689, "step": 19710 }, { "epoch": 0.59, "learning_rate": 1.8689288950522589e-06, "loss": 1.0861, "step": 19711 }, { "epoch": 0.59, "learning_rate": 1.8686928772210596e-06, "loss": 1.1899, "step": 19712 }, { "epoch": 0.59, "learning_rate": 1.8684568653996004e-06, "loss": 1.052, "step": 19713 }, { "epoch": 0.59, "learning_rate": 1.8682208595901278e-06, "loss": 1.0875, "step": 19714 }, { "epoch": 0.59, "learning_rate": 1.8679848597948885e-06, "loss": 1.1494, "step": 19715 }, { "epoch": 0.59, "learning_rate": 1.8677488660161294e-06, "loss": 1.0391, "step": 19716 }, { "epoch": 0.59, "learning_rate": 1.8675128782560958e-06, "loss": 1.1182, "step": 19717 }, { "epoch": 0.59, "learning_rate": 1.8672768965170352e-06, "loss": 0.9877, "step": 19718 }, { "epoch": 0.59, "learning_rate": 1.8670409208011941e-06, "loss": 1.1202, "step": 19719 }, { "epoch": 0.59, "learning_rate": 1.8668049511108183e-06, "loss": 1.1036, "step": 19720 }, { "epoch": 0.59, "learning_rate": 1.866568987448154e-06, "loss": 1.1713, "step": 19721 }, { "epoch": 0.59, "learning_rate": 1.866333029815448e-06, "loss": 1.0742, "step": 19722 }, { "epoch": 0.59, "learning_rate": 1.8660970782149467e-06, "loss": 1.0635, "step": 19723 }, { "epoch": 0.59, "learning_rate": 1.8658611326488967e-06, "loss": 1.0978, "step": 19724 }, { "epoch": 0.59, "learning_rate": 1.8656251931195424e-06, "loss": 1.02, "step": 19725 }, { "epoch": 0.59, "learning_rate": 1.8653892596291306e-06, "loss": 1.1094, "step": 19726 }, { "epoch": 0.59, "learning_rate": 1.8651533321799075e-06, "loss": 1.0511, "step": 19727 }, { "epoch": 0.59, "learning_rate": 1.8649174107741197e-06, "loss": 1.0503, "step": 19728 }, { "epoch": 0.59, "learning_rate": 1.8646814954140115e-06, "loss": 1.0798, "step": 19729 }, { "epoch": 0.59, "learning_rate": 1.8644455861018295e-06, "loss": 1.1756, "step": 19730 }, { "epoch": 0.59, "learning_rate": 1.8642096828398192e-06, "loss": 1.1442, "step": 19731 }, { "epoch": 0.59, "learning_rate": 1.8639737856302276e-06, "loss": 1.1299, "step": 19732 }, { "epoch": 0.59, "learning_rate": 1.8637378944752982e-06, "loss": 1.0923, "step": 19733 }, { "epoch": 0.59, "learning_rate": 1.8635020093772776e-06, "loss": 0.9417, "step": 19734 }, { "epoch": 0.59, "learning_rate": 1.8632661303384117e-06, "loss": 1.2097, "step": 19735 }, { "epoch": 0.59, "learning_rate": 1.8630302573609455e-06, "loss": 1.165, "step": 19736 }, { "epoch": 0.59, "learning_rate": 1.8627943904471251e-06, "loss": 1.0358, "step": 19737 }, { "epoch": 0.59, "learning_rate": 1.8625585295991943e-06, "loss": 1.0024, "step": 19738 }, { "epoch": 0.59, "learning_rate": 1.8623226748193996e-06, "loss": 1.1334, "step": 19739 }, { "epoch": 0.59, "learning_rate": 1.8620868261099855e-06, "loss": 1.1582, "step": 19740 }, { "epoch": 0.59, "learning_rate": 1.861850983473199e-06, "loss": 1.0803, "step": 19741 }, { "epoch": 0.59, "learning_rate": 1.8616151469112827e-06, "loss": 1.2327, "step": 19742 }, { "epoch": 0.59, "learning_rate": 1.8613793164264826e-06, "loss": 1.1816, "step": 19743 }, { "epoch": 0.59, "learning_rate": 1.8611434920210442e-06, "loss": 1.1311, "step": 19744 }, { "epoch": 0.59, "learning_rate": 1.8609076736972121e-06, "loss": 1.0773, "step": 19745 }, { "epoch": 0.59, "learning_rate": 1.8606718614572308e-06, "loss": 1.0945, "step": 19746 }, { "epoch": 0.59, "learning_rate": 1.8604360553033456e-06, "loss": 1.1379, "step": 19747 }, { "epoch": 0.59, "learning_rate": 1.8602002552378009e-06, "loss": 1.3244, "step": 19748 }, { "epoch": 0.59, "learning_rate": 1.859964461262842e-06, "loss": 1.2075, "step": 19749 }, { "epoch": 0.59, "learning_rate": 1.859728673380714e-06, "loss": 1.189, "step": 19750 }, { "epoch": 0.59, "learning_rate": 1.8594928915936594e-06, "loss": 1.1244, "step": 19751 }, { "epoch": 0.6, "learning_rate": 1.859257115903924e-06, "loss": 1.0948, "step": 19752 }, { "epoch": 0.6, "learning_rate": 1.8590213463137527e-06, "loss": 1.042, "step": 19753 }, { "epoch": 0.6, "learning_rate": 1.8587855828253903e-06, "loss": 1.0693, "step": 19754 }, { "epoch": 0.6, "learning_rate": 1.8585498254410794e-06, "loss": 1.2063, "step": 19755 }, { "epoch": 0.6, "learning_rate": 1.8583140741630651e-06, "loss": 1.2446, "step": 19756 }, { "epoch": 0.6, "learning_rate": 1.8580783289935917e-06, "loss": 1.0886, "step": 19757 }, { "epoch": 0.6, "learning_rate": 1.857842589934904e-06, "loss": 1.1038, "step": 19758 }, { "epoch": 0.6, "learning_rate": 1.857606856989245e-06, "loss": 1.0103, "step": 19759 }, { "epoch": 0.6, "learning_rate": 1.8573711301588592e-06, "loss": 1.1086, "step": 19760 }, { "epoch": 0.6, "learning_rate": 1.8571354094459912e-06, "loss": 1.1223, "step": 19761 }, { "epoch": 0.6, "learning_rate": 1.8568996948528842e-06, "loss": 1.1328, "step": 19762 }, { "epoch": 0.6, "learning_rate": 1.8566639863817838e-06, "loss": 1.0945, "step": 19763 }, { "epoch": 0.6, "learning_rate": 1.8564282840349306e-06, "loss": 1.1261, "step": 19764 }, { "epoch": 0.6, "learning_rate": 1.8561925878145708e-06, "loss": 0.9662, "step": 19765 }, { "epoch": 0.6, "learning_rate": 1.8559568977229472e-06, "loss": 1.1016, "step": 19766 }, { "epoch": 0.6, "learning_rate": 1.855721213762305e-06, "loss": 1.1871, "step": 19767 }, { "epoch": 0.6, "learning_rate": 1.8554855359348855e-06, "loss": 1.1087, "step": 19768 }, { "epoch": 0.6, "learning_rate": 1.8552498642429332e-06, "loss": 1.2037, "step": 19769 }, { "epoch": 0.6, "learning_rate": 1.8550141986886916e-06, "loss": 1.0897, "step": 19770 }, { "epoch": 0.6, "learning_rate": 1.8547785392744048e-06, "loss": 1.1192, "step": 19771 }, { "epoch": 0.6, "learning_rate": 1.854542886002315e-06, "loss": 1.1369, "step": 19772 }, { "epoch": 0.6, "learning_rate": 1.854307238874666e-06, "loss": 1.1652, "step": 19773 }, { "epoch": 0.6, "learning_rate": 1.8540715978937012e-06, "loss": 1.072, "step": 19774 }, { "epoch": 0.6, "learning_rate": 1.8538359630616636e-06, "loss": 1.0978, "step": 19775 }, { "epoch": 0.6, "learning_rate": 1.8536003343807977e-06, "loss": 1.0897, "step": 19776 }, { "epoch": 0.6, "learning_rate": 1.853364711853344e-06, "loss": 1.0651, "step": 19777 }, { "epoch": 0.6, "learning_rate": 1.853129095481547e-06, "loss": 0.9971, "step": 19778 }, { "epoch": 0.6, "learning_rate": 1.8528934852676496e-06, "loss": 1.207, "step": 19779 }, { "epoch": 0.6, "learning_rate": 1.8526578812138952e-06, "loss": 1.2112, "step": 19780 }, { "epoch": 0.6, "learning_rate": 1.8524222833225252e-06, "loss": 1.1487, "step": 19781 }, { "epoch": 0.6, "learning_rate": 1.8521866915957832e-06, "loss": 1.2094, "step": 19782 }, { "epoch": 0.6, "learning_rate": 1.851951106035912e-06, "loss": 1.0262, "step": 19783 }, { "epoch": 0.6, "learning_rate": 1.8517155266451543e-06, "loss": 1.082, "step": 19784 }, { "epoch": 0.6, "learning_rate": 1.8514799534257522e-06, "loss": 1.1595, "step": 19785 }, { "epoch": 0.6, "learning_rate": 1.8512443863799487e-06, "loss": 1.2726, "step": 19786 }, { "epoch": 0.6, "learning_rate": 1.8510088255099868e-06, "loss": 1.179, "step": 19787 }, { "epoch": 0.6, "learning_rate": 1.8507732708181076e-06, "loss": 1.1151, "step": 19788 }, { "epoch": 0.6, "learning_rate": 1.8505377223065545e-06, "loss": 1.1166, "step": 19789 }, { "epoch": 0.6, "learning_rate": 1.8503021799775695e-06, "loss": 1.023, "step": 19790 }, { "epoch": 0.6, "learning_rate": 1.8500666438333945e-06, "loss": 1.074, "step": 19791 }, { "epoch": 0.6, "learning_rate": 1.849831113876272e-06, "loss": 1.0047, "step": 19792 }, { "epoch": 0.6, "learning_rate": 1.8495955901084456e-06, "loss": 1.1277, "step": 19793 }, { "epoch": 0.6, "learning_rate": 1.8493600725321544e-06, "loss": 1.2181, "step": 19794 }, { "epoch": 0.6, "learning_rate": 1.8491245611496422e-06, "loss": 1.064, "step": 19795 }, { "epoch": 0.6, "learning_rate": 1.8488890559631506e-06, "loss": 1.1323, "step": 19796 }, { "epoch": 0.6, "learning_rate": 1.8486535569749225e-06, "loss": 1.1722, "step": 19797 }, { "epoch": 0.6, "learning_rate": 1.8484180641871986e-06, "loss": 1.0954, "step": 19798 }, { "epoch": 0.6, "learning_rate": 1.84818257760222e-06, "loss": 1.2046, "step": 19799 }, { "epoch": 0.6, "learning_rate": 1.8479470972222297e-06, "loss": 1.2183, "step": 19800 }, { "epoch": 0.6, "learning_rate": 1.847711623049469e-06, "loss": 1.1359, "step": 19801 }, { "epoch": 0.6, "learning_rate": 1.84747615508618e-06, "loss": 1.2567, "step": 19802 }, { "epoch": 0.6, "learning_rate": 1.8472406933346032e-06, "loss": 1.1042, "step": 19803 }, { "epoch": 0.6, "learning_rate": 1.8470052377969804e-06, "loss": 1.1525, "step": 19804 }, { "epoch": 0.6, "learning_rate": 1.8467697884755537e-06, "loss": 1.0449, "step": 19805 }, { "epoch": 0.6, "learning_rate": 1.8465343453725649e-06, "loss": 1.222, "step": 19806 }, { "epoch": 0.6, "learning_rate": 1.8462989084902532e-06, "loss": 1.0964, "step": 19807 }, { "epoch": 0.6, "learning_rate": 1.8460634778308611e-06, "loss": 1.106, "step": 19808 }, { "epoch": 0.6, "learning_rate": 1.84582805339663e-06, "loss": 1.0836, "step": 19809 }, { "epoch": 0.6, "learning_rate": 1.8455926351898013e-06, "loss": 1.2059, "step": 19810 }, { "epoch": 0.6, "learning_rate": 1.8453572232126149e-06, "loss": 1.154, "step": 19811 }, { "epoch": 0.6, "learning_rate": 1.8451218174673125e-06, "loss": 1.0463, "step": 19812 }, { "epoch": 0.6, "learning_rate": 1.8448864179561347e-06, "loss": 0.9445, "step": 19813 }, { "epoch": 0.6, "learning_rate": 1.8446510246813227e-06, "loss": 1.0513, "step": 19814 }, { "epoch": 0.6, "learning_rate": 1.844415637645118e-06, "loss": 1.1002, "step": 19815 }, { "epoch": 0.6, "learning_rate": 1.8441802568497602e-06, "loss": 1.0986, "step": 19816 }, { "epoch": 0.6, "learning_rate": 1.8439448822974903e-06, "loss": 1.1066, "step": 19817 }, { "epoch": 0.6, "learning_rate": 1.8437095139905493e-06, "loss": 1.0417, "step": 19818 }, { "epoch": 0.6, "learning_rate": 1.8434741519311788e-06, "loss": 1.1701, "step": 19819 }, { "epoch": 0.6, "learning_rate": 1.8432387961216169e-06, "loss": 1.1854, "step": 19820 }, { "epoch": 0.6, "learning_rate": 1.8430034465641055e-06, "loss": 1.1019, "step": 19821 }, { "epoch": 0.6, "learning_rate": 1.8427681032608849e-06, "loss": 1.0452, "step": 19822 }, { "epoch": 0.6, "learning_rate": 1.8425327662141962e-06, "loss": 1.1967, "step": 19823 }, { "epoch": 0.6, "learning_rate": 1.8422974354262783e-06, "loss": 1.2016, "step": 19824 }, { "epoch": 0.6, "learning_rate": 1.8420621108993719e-06, "loss": 1.118, "step": 19825 }, { "epoch": 0.6, "learning_rate": 1.841826792635717e-06, "loss": 1.0986, "step": 19826 }, { "epoch": 0.6, "learning_rate": 1.8415914806375546e-06, "loss": 1.1247, "step": 19827 }, { "epoch": 0.6, "learning_rate": 1.8413561749071243e-06, "loss": 1.0417, "step": 19828 }, { "epoch": 0.6, "learning_rate": 1.8411208754466655e-06, "loss": 1.0687, "step": 19829 }, { "epoch": 0.6, "learning_rate": 1.8408855822584188e-06, "loss": 1.2295, "step": 19830 }, { "epoch": 0.6, "learning_rate": 1.840650295344624e-06, "loss": 1.1931, "step": 19831 }, { "epoch": 0.6, "learning_rate": 1.8404150147075218e-06, "loss": 1.0934, "step": 19832 }, { "epoch": 0.6, "learning_rate": 1.8401797403493498e-06, "loss": 1.1923, "step": 19833 }, { "epoch": 0.6, "learning_rate": 1.839944472272349e-06, "loss": 1.1019, "step": 19834 }, { "epoch": 0.6, "learning_rate": 1.839709210478759e-06, "loss": 1.193, "step": 19835 }, { "epoch": 0.6, "learning_rate": 1.8394739549708201e-06, "loss": 1.1839, "step": 19836 }, { "epoch": 0.6, "learning_rate": 1.8392387057507702e-06, "loss": 1.2446, "step": 19837 }, { "epoch": 0.6, "learning_rate": 1.8390034628208498e-06, "loss": 1.1224, "step": 19838 }, { "epoch": 0.6, "learning_rate": 1.8387682261832975e-06, "loss": 1.0116, "step": 19839 }, { "epoch": 0.6, "learning_rate": 1.8385329958403537e-06, "loss": 1.0789, "step": 19840 }, { "epoch": 0.6, "learning_rate": 1.8382977717942574e-06, "loss": 1.1144, "step": 19841 }, { "epoch": 0.6, "learning_rate": 1.8380625540472474e-06, "loss": 1.1519, "step": 19842 }, { "epoch": 0.6, "learning_rate": 1.837827342601563e-06, "loss": 1.2446, "step": 19843 }, { "epoch": 0.6, "learning_rate": 1.8375921374594433e-06, "loss": 1.1429, "step": 19844 }, { "epoch": 0.6, "learning_rate": 1.8373569386231285e-06, "loss": 1.1629, "step": 19845 }, { "epoch": 0.6, "learning_rate": 1.8371217460948555e-06, "loss": 1.1399, "step": 19846 }, { "epoch": 0.6, "learning_rate": 1.8368865598768642e-06, "loss": 1.0792, "step": 19847 }, { "epoch": 0.6, "learning_rate": 1.8366513799713937e-06, "loss": 1.1135, "step": 19848 }, { "epoch": 0.6, "learning_rate": 1.8364162063806833e-06, "loss": 1.1899, "step": 19849 }, { "epoch": 0.6, "learning_rate": 1.8361810391069701e-06, "loss": 1.1084, "step": 19850 }, { "epoch": 0.6, "learning_rate": 1.8359458781524935e-06, "loss": 1.0707, "step": 19851 }, { "epoch": 0.6, "learning_rate": 1.8357107235194926e-06, "loss": 1.1323, "step": 19852 }, { "epoch": 0.6, "learning_rate": 1.8354755752102057e-06, "loss": 0.9926, "step": 19853 }, { "epoch": 0.6, "learning_rate": 1.8352404332268717e-06, "loss": 1.1796, "step": 19854 }, { "epoch": 0.6, "learning_rate": 1.835005297571728e-06, "loss": 1.2086, "step": 19855 }, { "epoch": 0.6, "learning_rate": 1.8347701682470136e-06, "loss": 1.1851, "step": 19856 }, { "epoch": 0.6, "learning_rate": 1.834535045254967e-06, "loss": 1.1375, "step": 19857 }, { "epoch": 0.6, "learning_rate": 1.8342999285978275e-06, "loss": 1.1865, "step": 19858 }, { "epoch": 0.6, "learning_rate": 1.8340648182778306e-06, "loss": 1.0667, "step": 19859 }, { "epoch": 0.6, "learning_rate": 1.8338297142972162e-06, "loss": 1.1578, "step": 19860 }, { "epoch": 0.6, "learning_rate": 1.833594616658222e-06, "loss": 1.2303, "step": 19861 }, { "epoch": 0.6, "learning_rate": 1.833359525363087e-06, "loss": 1.1462, "step": 19862 }, { "epoch": 0.6, "learning_rate": 1.8331244404140469e-06, "loss": 1.1522, "step": 19863 }, { "epoch": 0.6, "learning_rate": 1.8328893618133415e-06, "loss": 1.1474, "step": 19864 }, { "epoch": 0.6, "learning_rate": 1.832654289563208e-06, "loss": 1.1276, "step": 19865 }, { "epoch": 0.6, "learning_rate": 1.8324192236658848e-06, "loss": 1.1496, "step": 19866 }, { "epoch": 0.6, "learning_rate": 1.8321841641236083e-06, "loss": 1.1887, "step": 19867 }, { "epoch": 0.6, "learning_rate": 1.831949110938617e-06, "loss": 1.1438, "step": 19868 }, { "epoch": 0.6, "learning_rate": 1.8317140641131487e-06, "loss": 1.0962, "step": 19869 }, { "epoch": 0.6, "learning_rate": 1.8314790236494407e-06, "loss": 1.0242, "step": 19870 }, { "epoch": 0.6, "learning_rate": 1.8312439895497309e-06, "loss": 1.069, "step": 19871 }, { "epoch": 0.6, "learning_rate": 1.8310089618162553e-06, "loss": 1.0868, "step": 19872 }, { "epoch": 0.6, "learning_rate": 1.8307739404512526e-06, "loss": 1.1796, "step": 19873 }, { "epoch": 0.6, "learning_rate": 1.8305389254569594e-06, "loss": 1.2183, "step": 19874 }, { "epoch": 0.6, "learning_rate": 1.8303039168356144e-06, "loss": 1.0625, "step": 19875 }, { "epoch": 0.6, "learning_rate": 1.8300689145894523e-06, "loss": 1.0726, "step": 19876 }, { "epoch": 0.6, "learning_rate": 1.8298339187207116e-06, "loss": 1.1098, "step": 19877 }, { "epoch": 0.6, "learning_rate": 1.8295989292316293e-06, "loss": 1.0068, "step": 19878 }, { "epoch": 0.6, "learning_rate": 1.8293639461244428e-06, "loss": 1.0712, "step": 19879 }, { "epoch": 0.6, "learning_rate": 1.829128969401388e-06, "loss": 1.1914, "step": 19880 }, { "epoch": 0.6, "learning_rate": 1.8288939990647028e-06, "loss": 1.2217, "step": 19881 }, { "epoch": 0.6, "learning_rate": 1.828659035116623e-06, "loss": 1.0304, "step": 19882 }, { "epoch": 0.6, "learning_rate": 1.828424077559386e-06, "loss": 1.0726, "step": 19883 }, { "epoch": 0.6, "learning_rate": 1.828189126395229e-06, "loss": 1.0176, "step": 19884 }, { "epoch": 0.6, "learning_rate": 1.8279541816263868e-06, "loss": 1.2953, "step": 19885 }, { "epoch": 0.6, "learning_rate": 1.8277192432550976e-06, "loss": 1.0952, "step": 19886 }, { "epoch": 0.6, "learning_rate": 1.8274843112835975e-06, "loss": 1.2147, "step": 19887 }, { "epoch": 0.6, "learning_rate": 1.827249385714124e-06, "loss": 1.1571, "step": 19888 }, { "epoch": 0.6, "learning_rate": 1.8270144665489108e-06, "loss": 0.9963, "step": 19889 }, { "epoch": 0.6, "learning_rate": 1.826779553790196e-06, "loss": 1.09, "step": 19890 }, { "epoch": 0.6, "learning_rate": 1.8265446474402154e-06, "loss": 1.0807, "step": 19891 }, { "epoch": 0.6, "learning_rate": 1.826309747501207e-06, "loss": 1.0657, "step": 19892 }, { "epoch": 0.6, "learning_rate": 1.8260748539754037e-06, "loss": 1.1951, "step": 19893 }, { "epoch": 0.6, "learning_rate": 1.8258399668650437e-06, "loss": 1.0937, "step": 19894 }, { "epoch": 0.6, "learning_rate": 1.8256050861723623e-06, "loss": 1.0955, "step": 19895 }, { "epoch": 0.6, "learning_rate": 1.8253702118995955e-06, "loss": 1.165, "step": 19896 }, { "epoch": 0.6, "learning_rate": 1.8251353440489803e-06, "loss": 1.1974, "step": 19897 }, { "epoch": 0.6, "learning_rate": 1.8249004826227506e-06, "loss": 1.1481, "step": 19898 }, { "epoch": 0.6, "learning_rate": 1.8246656276231437e-06, "loss": 1.0814, "step": 19899 }, { "epoch": 0.6, "learning_rate": 1.8244307790523943e-06, "loss": 1.032, "step": 19900 }, { "epoch": 0.6, "learning_rate": 1.82419593691274e-06, "loss": 1.1415, "step": 19901 }, { "epoch": 0.6, "learning_rate": 1.8239611012064135e-06, "loss": 1.0507, "step": 19902 }, { "epoch": 0.6, "learning_rate": 1.823726271935652e-06, "loss": 1.0953, "step": 19903 }, { "epoch": 0.6, "learning_rate": 1.8234914491026902e-06, "loss": 1.1796, "step": 19904 }, { "epoch": 0.6, "learning_rate": 1.8232566327097655e-06, "loss": 1.1277, "step": 19905 }, { "epoch": 0.6, "learning_rate": 1.8230218227591106e-06, "loss": 1.1268, "step": 19906 }, { "epoch": 0.6, "learning_rate": 1.8227870192529617e-06, "loss": 1.101, "step": 19907 }, { "epoch": 0.6, "learning_rate": 1.8225522221935547e-06, "loss": 1.1666, "step": 19908 }, { "epoch": 0.6, "learning_rate": 1.8223174315831239e-06, "loss": 1.0615, "step": 19909 }, { "epoch": 0.6, "learning_rate": 1.822082647423905e-06, "loss": 1.0641, "step": 19910 }, { "epoch": 0.6, "learning_rate": 1.821847869718133e-06, "loss": 1.233, "step": 19911 }, { "epoch": 0.6, "learning_rate": 1.8216130984680422e-06, "loss": 1.1423, "step": 19912 }, { "epoch": 0.6, "learning_rate": 1.8213783336758678e-06, "loss": 1.1627, "step": 19913 }, { "epoch": 0.6, "learning_rate": 1.8211435753438465e-06, "loss": 1.121, "step": 19914 }, { "epoch": 0.6, "learning_rate": 1.82090882347421e-06, "loss": 1.054, "step": 19915 }, { "epoch": 0.6, "learning_rate": 1.8206740780691945e-06, "loss": 1.123, "step": 19916 }, { "epoch": 0.6, "learning_rate": 1.8204393391310344e-06, "loss": 1.1771, "step": 19917 }, { "epoch": 0.6, "learning_rate": 1.8202046066619655e-06, "loss": 1.1347, "step": 19918 }, { "epoch": 0.6, "learning_rate": 1.8199698806642207e-06, "loss": 1.1284, "step": 19919 }, { "epoch": 0.6, "learning_rate": 1.819735161140035e-06, "loss": 1.2062, "step": 19920 }, { "epoch": 0.6, "learning_rate": 1.8195004480916429e-06, "loss": 1.0996, "step": 19921 }, { "epoch": 0.6, "learning_rate": 1.8192657415212787e-06, "loss": 1.1387, "step": 19922 }, { "epoch": 0.6, "learning_rate": 1.8190310414311774e-06, "loss": 1.0894, "step": 19923 }, { "epoch": 0.6, "learning_rate": 1.818796347823572e-06, "loss": 1.0775, "step": 19924 }, { "epoch": 0.6, "learning_rate": 1.8185616607006973e-06, "loss": 1.1882, "step": 19925 }, { "epoch": 0.6, "learning_rate": 1.8183269800647873e-06, "loss": 1.1122, "step": 19926 }, { "epoch": 0.6, "learning_rate": 1.8180923059180774e-06, "loss": 1.0231, "step": 19927 }, { "epoch": 0.6, "learning_rate": 1.8178576382627994e-06, "loss": 1.1058, "step": 19928 }, { "epoch": 0.6, "learning_rate": 1.8176229771011878e-06, "loss": 1.0843, "step": 19929 }, { "epoch": 0.6, "learning_rate": 1.8173883224354772e-06, "loss": 1.1053, "step": 19930 }, { "epoch": 0.6, "learning_rate": 1.817153674267902e-06, "loss": 1.1666, "step": 19931 }, { "epoch": 0.6, "learning_rate": 1.8169190326006937e-06, "loss": 1.1081, "step": 19932 }, { "epoch": 0.6, "learning_rate": 1.816684397436087e-06, "loss": 1.0461, "step": 19933 }, { "epoch": 0.6, "learning_rate": 1.816449768776316e-06, "loss": 1.0635, "step": 19934 }, { "epoch": 0.6, "learning_rate": 1.8162151466236138e-06, "loss": 1.0917, "step": 19935 }, { "epoch": 0.6, "learning_rate": 1.815980530980215e-06, "loss": 1.0925, "step": 19936 }, { "epoch": 0.6, "learning_rate": 1.8157459218483514e-06, "loss": 1.2339, "step": 19937 }, { "epoch": 0.6, "learning_rate": 1.8155113192302571e-06, "loss": 1.1699, "step": 19938 }, { "epoch": 0.6, "learning_rate": 1.8152767231281654e-06, "loss": 1.1711, "step": 19939 }, { "epoch": 0.6, "learning_rate": 1.8150421335443106e-06, "loss": 1.0911, "step": 19940 }, { "epoch": 0.6, "learning_rate": 1.8148075504809238e-06, "loss": 1.114, "step": 19941 }, { "epoch": 0.6, "learning_rate": 1.814572973940239e-06, "loss": 1.1096, "step": 19942 }, { "epoch": 0.6, "learning_rate": 1.8143384039244892e-06, "loss": 1.116, "step": 19943 }, { "epoch": 0.6, "learning_rate": 1.814103840435909e-06, "loss": 1.1222, "step": 19944 }, { "epoch": 0.6, "learning_rate": 1.8138692834767285e-06, "loss": 0.9872, "step": 19945 }, { "epoch": 0.6, "learning_rate": 1.8136347330491821e-06, "loss": 1.0497, "step": 19946 }, { "epoch": 0.6, "learning_rate": 1.8134001891555026e-06, "loss": 1.1102, "step": 19947 }, { "epoch": 0.6, "learning_rate": 1.8131656517979223e-06, "loss": 0.9819, "step": 19948 }, { "epoch": 0.6, "learning_rate": 1.8129311209786748e-06, "loss": 1.1503, "step": 19949 }, { "epoch": 0.6, "learning_rate": 1.812696596699992e-06, "loss": 1.0425, "step": 19950 }, { "epoch": 0.6, "learning_rate": 1.8124620789641061e-06, "loss": 1.1026, "step": 19951 }, { "epoch": 0.6, "learning_rate": 1.812227567773251e-06, "loss": 1.1876, "step": 19952 }, { "epoch": 0.6, "learning_rate": 1.8119930631296582e-06, "loss": 1.0204, "step": 19953 }, { "epoch": 0.6, "learning_rate": 1.8117585650355594e-06, "loss": 1.0471, "step": 19954 }, { "epoch": 0.6, "learning_rate": 1.8115240734931874e-06, "loss": 1.1448, "step": 19955 }, { "epoch": 0.6, "learning_rate": 1.811289588504775e-06, "loss": 0.9832, "step": 19956 }, { "epoch": 0.6, "learning_rate": 1.8110551100725548e-06, "loss": 1.1405, "step": 19957 }, { "epoch": 0.6, "learning_rate": 1.8108206381987573e-06, "loss": 1.15, "step": 19958 }, { "epoch": 0.6, "learning_rate": 1.8105861728856152e-06, "loss": 1.0006, "step": 19959 }, { "epoch": 0.6, "learning_rate": 1.8103517141353608e-06, "loss": 0.9826, "step": 19960 }, { "epoch": 0.6, "learning_rate": 1.810117261950226e-06, "loss": 1.2191, "step": 19961 }, { "epoch": 0.6, "learning_rate": 1.809882816332443e-06, "loss": 1.1671, "step": 19962 }, { "epoch": 0.6, "learning_rate": 1.8096483772842433e-06, "loss": 1.1222, "step": 19963 }, { "epoch": 0.6, "learning_rate": 1.8094139448078578e-06, "loss": 1.0743, "step": 19964 }, { "epoch": 0.6, "learning_rate": 1.8091795189055195e-06, "loss": 1.0598, "step": 19965 }, { "epoch": 0.6, "learning_rate": 1.8089450995794594e-06, "loss": 1.0972, "step": 19966 }, { "epoch": 0.6, "learning_rate": 1.8087106868319091e-06, "loss": 1.2065, "step": 19967 }, { "epoch": 0.6, "learning_rate": 1.8084762806650999e-06, "loss": 1.0562, "step": 19968 }, { "epoch": 0.6, "learning_rate": 1.8082418810812636e-06, "loss": 1.202, "step": 19969 }, { "epoch": 0.6, "learning_rate": 1.808007488082632e-06, "loss": 1.2052, "step": 19970 }, { "epoch": 0.6, "learning_rate": 1.8077731016714354e-06, "loss": 1.12, "step": 19971 }, { "epoch": 0.6, "learning_rate": 1.8075387218499053e-06, "loss": 1.1133, "step": 19972 }, { "epoch": 0.6, "learning_rate": 1.8073043486202728e-06, "loss": 1.0619, "step": 19973 }, { "epoch": 0.6, "learning_rate": 1.8070699819847693e-06, "loss": 1.0869, "step": 19974 }, { "epoch": 0.6, "learning_rate": 1.8068356219456273e-06, "loss": 1.2502, "step": 19975 }, { "epoch": 0.6, "learning_rate": 1.8066012685050749e-06, "loss": 1.1232, "step": 19976 }, { "epoch": 0.6, "learning_rate": 1.8063669216653445e-06, "loss": 1.0923, "step": 19977 }, { "epoch": 0.6, "learning_rate": 1.8061325814286674e-06, "loss": 1.0808, "step": 19978 }, { "epoch": 0.6, "learning_rate": 1.8058982477972742e-06, "loss": 1.1892, "step": 19979 }, { "epoch": 0.6, "learning_rate": 1.8056639207733946e-06, "loss": 1.0878, "step": 19980 }, { "epoch": 0.6, "learning_rate": 1.8054296003592603e-06, "loss": 1.1274, "step": 19981 }, { "epoch": 0.6, "learning_rate": 1.8051952865571016e-06, "loss": 1.1678, "step": 19982 }, { "epoch": 0.6, "learning_rate": 1.8049609793691502e-06, "loss": 1.0356, "step": 19983 }, { "epoch": 0.6, "learning_rate": 1.8047266787976347e-06, "loss": 0.9158, "step": 19984 }, { "epoch": 0.6, "learning_rate": 1.804492384844786e-06, "loss": 1.191, "step": 19985 }, { "epoch": 0.6, "learning_rate": 1.8042580975128352e-06, "loss": 1.0986, "step": 19986 }, { "epoch": 0.6, "learning_rate": 1.804023816804012e-06, "loss": 1.1691, "step": 19987 }, { "epoch": 0.6, "learning_rate": 1.8037895427205478e-06, "loss": 1.1005, "step": 19988 }, { "epoch": 0.6, "learning_rate": 1.8035552752646712e-06, "loss": 1.0938, "step": 19989 }, { "epoch": 0.6, "learning_rate": 1.8033210144386127e-06, "loss": 1.1456, "step": 19990 }, { "epoch": 0.6, "learning_rate": 1.8030867602446026e-06, "loss": 1.1761, "step": 19991 }, { "epoch": 0.6, "learning_rate": 1.8028525126848715e-06, "loss": 1.1002, "step": 19992 }, { "epoch": 0.6, "learning_rate": 1.802618271761648e-06, "loss": 1.1376, "step": 19993 }, { "epoch": 0.6, "learning_rate": 1.8023840374771628e-06, "loss": 1.1728, "step": 19994 }, { "epoch": 0.6, "learning_rate": 1.802149809833646e-06, "loss": 1.1602, "step": 19995 }, { "epoch": 0.6, "learning_rate": 1.8019155888333274e-06, "loss": 1.0687, "step": 19996 }, { "epoch": 0.6, "learning_rate": 1.8016813744784354e-06, "loss": 1.1523, "step": 19997 }, { "epoch": 0.6, "learning_rate": 1.8014471667712002e-06, "loss": 1.025, "step": 19998 }, { "epoch": 0.6, "learning_rate": 1.8012129657138516e-06, "loss": 1.2533, "step": 19999 }, { "epoch": 0.6, "learning_rate": 1.8009787713086192e-06, "loss": 1.1213, "step": 20000 }, { "epoch": 0.6, "learning_rate": 1.800744583557733e-06, "loss": 1.1194, "step": 20001 }, { "epoch": 0.6, "learning_rate": 1.8005104024634206e-06, "loss": 1.0847, "step": 20002 }, { "epoch": 0.6, "learning_rate": 1.8002762280279126e-06, "loss": 1.1537, "step": 20003 }, { "epoch": 0.6, "learning_rate": 1.8000420602534378e-06, "loss": 1.1457, "step": 20004 }, { "epoch": 0.6, "learning_rate": 1.7998078991422258e-06, "loss": 1.2397, "step": 20005 }, { "epoch": 0.6, "learning_rate": 1.799573744696505e-06, "loss": 1.147, "step": 20006 }, { "epoch": 0.6, "learning_rate": 1.7993395969185047e-06, "loss": 1.0157, "step": 20007 }, { "epoch": 0.6, "learning_rate": 1.7991054558104539e-06, "loss": 1.0848, "step": 20008 }, { "epoch": 0.6, "learning_rate": 1.7988713213745828e-06, "loss": 0.9249, "step": 20009 }, { "epoch": 0.6, "learning_rate": 1.798637193613118e-06, "loss": 1.3066, "step": 20010 }, { "epoch": 0.6, "learning_rate": 1.7984030725282895e-06, "loss": 1.0892, "step": 20011 }, { "epoch": 0.6, "learning_rate": 1.7981689581223256e-06, "loss": 1.1514, "step": 20012 }, { "epoch": 0.6, "learning_rate": 1.7979348503974554e-06, "loss": 1.1121, "step": 20013 }, { "epoch": 0.6, "learning_rate": 1.7977007493559082e-06, "loss": 1.1228, "step": 20014 }, { "epoch": 0.6, "learning_rate": 1.7974666549999104e-06, "loss": 1.0558, "step": 20015 }, { "epoch": 0.6, "learning_rate": 1.797232567331692e-06, "loss": 1.0118, "step": 20016 }, { "epoch": 0.6, "learning_rate": 1.7969984863534812e-06, "loss": 1.0948, "step": 20017 }, { "epoch": 0.6, "learning_rate": 1.7967644120675066e-06, "loss": 1.3743, "step": 20018 }, { "epoch": 0.6, "learning_rate": 1.796530344475995e-06, "loss": 1.0497, "step": 20019 }, { "epoch": 0.6, "learning_rate": 1.7962962835811764e-06, "loss": 1.1454, "step": 20020 }, { "epoch": 0.6, "learning_rate": 1.7960622293852782e-06, "loss": 1.1245, "step": 20021 }, { "epoch": 0.6, "learning_rate": 1.7958281818905297e-06, "loss": 1.0529, "step": 20022 }, { "epoch": 0.6, "learning_rate": 1.7955941410991563e-06, "loss": 1.2496, "step": 20023 }, { "epoch": 0.6, "learning_rate": 1.7953601070133878e-06, "loss": 1.2384, "step": 20024 }, { "epoch": 0.6, "learning_rate": 1.7951260796354513e-06, "loss": 0.9192, "step": 20025 }, { "epoch": 0.6, "learning_rate": 1.7948920589675756e-06, "loss": 1.0106, "step": 20026 }, { "epoch": 0.6, "learning_rate": 1.7946580450119886e-06, "loss": 1.2045, "step": 20027 }, { "epoch": 0.6, "learning_rate": 1.7944240377709162e-06, "loss": 1.2542, "step": 20028 }, { "epoch": 0.6, "learning_rate": 1.7941900372465873e-06, "loss": 1.1675, "step": 20029 }, { "epoch": 0.6, "learning_rate": 1.7939560434412296e-06, "loss": 1.0825, "step": 20030 }, { "epoch": 0.6, "learning_rate": 1.7937220563570702e-06, "loss": 0.9799, "step": 20031 }, { "epoch": 0.6, "learning_rate": 1.7934880759963364e-06, "loss": 1.1329, "step": 20032 }, { "epoch": 0.6, "learning_rate": 1.793254102361256e-06, "loss": 1.1906, "step": 20033 }, { "epoch": 0.6, "learning_rate": 1.7930201354540566e-06, "loss": 1.1116, "step": 20034 }, { "epoch": 0.6, "learning_rate": 1.7927861752769651e-06, "loss": 1.1352, "step": 20035 }, { "epoch": 0.6, "learning_rate": 1.792552221832208e-06, "loss": 1.1708, "step": 20036 }, { "epoch": 0.6, "learning_rate": 1.792318275122013e-06, "loss": 1.151, "step": 20037 }, { "epoch": 0.6, "learning_rate": 1.7920843351486073e-06, "loss": 1.0452, "step": 20038 }, { "epoch": 0.6, "learning_rate": 1.7918504019142178e-06, "loss": 1.1716, "step": 20039 }, { "epoch": 0.6, "learning_rate": 1.7916164754210724e-06, "loss": 1.0125, "step": 20040 }, { "epoch": 0.6, "learning_rate": 1.791382555671396e-06, "loss": 1.1174, "step": 20041 }, { "epoch": 0.6, "learning_rate": 1.7911486426674164e-06, "loss": 1.1636, "step": 20042 }, { "epoch": 0.6, "learning_rate": 1.79091473641136e-06, "loss": 1.1584, "step": 20043 }, { "epoch": 0.6, "learning_rate": 1.7906808369054545e-06, "loss": 1.1206, "step": 20044 }, { "epoch": 0.6, "learning_rate": 1.790446944151926e-06, "loss": 1.073, "step": 20045 }, { "epoch": 0.6, "learning_rate": 1.7902130581530004e-06, "loss": 1.0914, "step": 20046 }, { "epoch": 0.6, "learning_rate": 1.7899791789109042e-06, "loss": 1.0983, "step": 20047 }, { "epoch": 0.6, "learning_rate": 1.789745306427865e-06, "loss": 1.201, "step": 20048 }, { "epoch": 0.6, "learning_rate": 1.7895114407061078e-06, "loss": 1.1578, "step": 20049 }, { "epoch": 0.6, "learning_rate": 1.7892775817478596e-06, "loss": 0.9492, "step": 20050 }, { "epoch": 0.6, "learning_rate": 1.7890437295553464e-06, "loss": 1.2173, "step": 20051 }, { "epoch": 0.6, "learning_rate": 1.788809884130796e-06, "loss": 1.1174, "step": 20052 }, { "epoch": 0.6, "learning_rate": 1.7885760454764316e-06, "loss": 1.0229, "step": 20053 }, { "epoch": 0.6, "learning_rate": 1.7883422135944806e-06, "loss": 1.0797, "step": 20054 }, { "epoch": 0.6, "learning_rate": 1.7881083884871691e-06, "loss": 1.0804, "step": 20055 }, { "epoch": 0.6, "learning_rate": 1.7878745701567226e-06, "loss": 1.1874, "step": 20056 }, { "epoch": 0.6, "learning_rate": 1.7876407586053684e-06, "loss": 1.1908, "step": 20057 }, { "epoch": 0.6, "learning_rate": 1.7874069538353303e-06, "loss": 1.1255, "step": 20058 }, { "epoch": 0.6, "learning_rate": 1.7871731558488345e-06, "loss": 1.0368, "step": 20059 }, { "epoch": 0.6, "learning_rate": 1.7869393646481071e-06, "loss": 1.1204, "step": 20060 }, { "epoch": 0.6, "learning_rate": 1.7867055802353738e-06, "loss": 1.141, "step": 20061 }, { "epoch": 0.6, "learning_rate": 1.7864718026128596e-06, "loss": 1.1223, "step": 20062 }, { "epoch": 0.6, "learning_rate": 1.7862380317827905e-06, "loss": 1.1036, "step": 20063 }, { "epoch": 0.6, "learning_rate": 1.786004267747391e-06, "loss": 1.0153, "step": 20064 }, { "epoch": 0.6, "learning_rate": 1.7857705105088882e-06, "loss": 1.0723, "step": 20065 }, { "epoch": 0.6, "learning_rate": 1.785536760069505e-06, "loss": 1.0894, "step": 20066 }, { "epoch": 0.6, "learning_rate": 1.785303016431468e-06, "loss": 1.1023, "step": 20067 }, { "epoch": 0.6, "learning_rate": 1.785069279597002e-06, "loss": 1.0361, "step": 20068 }, { "epoch": 0.6, "learning_rate": 1.7848355495683324e-06, "loss": 1.0189, "step": 20069 }, { "epoch": 0.6, "learning_rate": 1.7846018263476845e-06, "loss": 1.2271, "step": 20070 }, { "epoch": 0.6, "learning_rate": 1.7843681099372816e-06, "loss": 1.1506, "step": 20071 }, { "epoch": 0.6, "learning_rate": 1.7841344003393503e-06, "loss": 1.1088, "step": 20072 }, { "epoch": 0.6, "learning_rate": 1.783900697556114e-06, "loss": 1.1296, "step": 20073 }, { "epoch": 0.6, "learning_rate": 1.7836670015897988e-06, "loss": 1.0932, "step": 20074 }, { "epoch": 0.6, "learning_rate": 1.7834333124426284e-06, "loss": 1.0684, "step": 20075 }, { "epoch": 0.6, "learning_rate": 1.7831996301168277e-06, "loss": 1.181, "step": 20076 }, { "epoch": 0.6, "learning_rate": 1.7829659546146216e-06, "loss": 1.0178, "step": 20077 }, { "epoch": 0.6, "learning_rate": 1.7827322859382351e-06, "loss": 1.0263, "step": 20078 }, { "epoch": 0.6, "learning_rate": 1.7824986240898907e-06, "loss": 1.1072, "step": 20079 }, { "epoch": 0.6, "learning_rate": 1.7822649690718135e-06, "loss": 1.2153, "step": 20080 }, { "epoch": 0.6, "learning_rate": 1.782031320886229e-06, "loss": 1.2266, "step": 20081 }, { "epoch": 0.6, "learning_rate": 1.7817976795353597e-06, "loss": 1.0706, "step": 20082 }, { "epoch": 0.61, "learning_rate": 1.781564045021432e-06, "loss": 1.149, "step": 20083 }, { "epoch": 0.61, "learning_rate": 1.7813304173466674e-06, "loss": 1.0936, "step": 20084 }, { "epoch": 0.61, "learning_rate": 1.7810967965132914e-06, "loss": 1.0762, "step": 20085 }, { "epoch": 0.61, "learning_rate": 1.7808631825235274e-06, "loss": 1.0901, "step": 20086 }, { "epoch": 0.61, "learning_rate": 1.7806295753796e-06, "loss": 1.2012, "step": 20087 }, { "epoch": 0.61, "learning_rate": 1.7803959750837324e-06, "loss": 1.077, "step": 20088 }, { "epoch": 0.61, "learning_rate": 1.780162381638148e-06, "loss": 1.1071, "step": 20089 }, { "epoch": 0.61, "learning_rate": 1.7799287950450717e-06, "loss": 1.1374, "step": 20090 }, { "epoch": 0.61, "learning_rate": 1.7796952153067271e-06, "loss": 0.9744, "step": 20091 }, { "epoch": 0.61, "learning_rate": 1.7794616424253362e-06, "loss": 1.1335, "step": 20092 }, { "epoch": 0.61, "learning_rate": 1.7792280764031233e-06, "loss": 1.0871, "step": 20093 }, { "epoch": 0.61, "learning_rate": 1.7789945172423124e-06, "loss": 1.0684, "step": 20094 }, { "epoch": 0.61, "learning_rate": 1.778760964945126e-06, "loss": 1.1111, "step": 20095 }, { "epoch": 0.61, "learning_rate": 1.7785274195137893e-06, "loss": 1.1359, "step": 20096 }, { "epoch": 0.61, "learning_rate": 1.7782938809505224e-06, "loss": 1.1425, "step": 20097 }, { "epoch": 0.61, "learning_rate": 1.7780603492575503e-06, "loss": 1.1142, "step": 20098 }, { "epoch": 0.61, "learning_rate": 1.7778268244370966e-06, "loss": 1.0266, "step": 20099 }, { "epoch": 0.61, "learning_rate": 1.777593306491384e-06, "loss": 1.1685, "step": 20100 }, { "epoch": 0.61, "learning_rate": 1.7773597954226346e-06, "loss": 1.0294, "step": 20101 }, { "epoch": 0.61, "learning_rate": 1.7771262912330718e-06, "loss": 1.1239, "step": 20102 }, { "epoch": 0.61, "learning_rate": 1.7768927939249186e-06, "loss": 1.0851, "step": 20103 }, { "epoch": 0.61, "learning_rate": 1.7766593035003986e-06, "loss": 1.1198, "step": 20104 }, { "epoch": 0.61, "learning_rate": 1.7764258199617329e-06, "loss": 1.1829, "step": 20105 }, { "epoch": 0.61, "learning_rate": 1.776192343311145e-06, "loss": 1.2559, "step": 20106 }, { "epoch": 0.61, "learning_rate": 1.775958873550857e-06, "loss": 1.0566, "step": 20107 }, { "epoch": 0.61, "learning_rate": 1.7757254106830923e-06, "loss": 1.1425, "step": 20108 }, { "epoch": 0.61, "learning_rate": 1.7754919547100735e-06, "loss": 0.9457, "step": 20109 }, { "epoch": 0.61, "learning_rate": 1.7752585056340216e-06, "loss": 1.1156, "step": 20110 }, { "epoch": 0.61, "learning_rate": 1.7750250634571595e-06, "loss": 1.1622, "step": 20111 }, { "epoch": 0.61, "learning_rate": 1.7747916281817096e-06, "loss": 0.9607, "step": 20112 }, { "epoch": 0.61, "learning_rate": 1.7745581998098948e-06, "loss": 1.0823, "step": 20113 }, { "epoch": 0.61, "learning_rate": 1.774324778343936e-06, "loss": 1.1738, "step": 20114 }, { "epoch": 0.61, "learning_rate": 1.7740913637860557e-06, "loss": 1.0475, "step": 20115 }, { "epoch": 0.61, "learning_rate": 1.7738579561384761e-06, "loss": 1.1296, "step": 20116 }, { "epoch": 0.61, "learning_rate": 1.77362455540342e-06, "loss": 1.0861, "step": 20117 }, { "epoch": 0.61, "learning_rate": 1.7733911615831073e-06, "loss": 1.2208, "step": 20118 }, { "epoch": 0.61, "learning_rate": 1.773157774679761e-06, "loss": 1.064, "step": 20119 }, { "epoch": 0.61, "learning_rate": 1.7729243946956027e-06, "loss": 1.1283, "step": 20120 }, { "epoch": 0.61, "learning_rate": 1.7726910216328536e-06, "loss": 1.12, "step": 20121 }, { "epoch": 0.61, "learning_rate": 1.7724576554937368e-06, "loss": 0.9951, "step": 20122 }, { "epoch": 0.61, "learning_rate": 1.7722242962804717e-06, "loss": 1.2339, "step": 20123 }, { "epoch": 0.61, "learning_rate": 1.7719909439952809e-06, "loss": 1.0972, "step": 20124 }, { "epoch": 0.61, "learning_rate": 1.7717575986403858e-06, "loss": 1.0711, "step": 20125 }, { "epoch": 0.61, "learning_rate": 1.7715242602180077e-06, "loss": 1.0701, "step": 20126 }, { "epoch": 0.61, "learning_rate": 1.7712909287303675e-06, "loss": 1.063, "step": 20127 }, { "epoch": 0.61, "learning_rate": 1.7710576041796873e-06, "loss": 1.0916, "step": 20128 }, { "epoch": 0.61, "learning_rate": 1.7708242865681874e-06, "loss": 1.0329, "step": 20129 }, { "epoch": 0.61, "learning_rate": 1.7705909758980891e-06, "loss": 1.1337, "step": 20130 }, { "epoch": 0.61, "learning_rate": 1.7703576721716131e-06, "loss": 1.2198, "step": 20131 }, { "epoch": 0.61, "learning_rate": 1.7701243753909809e-06, "loss": 1.0698, "step": 20132 }, { "epoch": 0.61, "learning_rate": 1.7698910855584128e-06, "loss": 1.1767, "step": 20133 }, { "epoch": 0.61, "learning_rate": 1.7696578026761299e-06, "loss": 1.1614, "step": 20134 }, { "epoch": 0.61, "learning_rate": 1.7694245267463542e-06, "loss": 0.9735, "step": 20135 }, { "epoch": 0.61, "learning_rate": 1.7691912577713038e-06, "loss": 1.1478, "step": 20136 }, { "epoch": 0.61, "learning_rate": 1.768957995753201e-06, "loss": 1.1613, "step": 20137 }, { "epoch": 0.61, "learning_rate": 1.768724740694266e-06, "loss": 1.1635, "step": 20138 }, { "epoch": 0.61, "learning_rate": 1.7684914925967202e-06, "loss": 1.0972, "step": 20139 }, { "epoch": 0.61, "learning_rate": 1.768258251462782e-06, "loss": 1.0757, "step": 20140 }, { "epoch": 0.61, "learning_rate": 1.768025017294673e-06, "loss": 1.0436, "step": 20141 }, { "epoch": 0.61, "learning_rate": 1.767791790094613e-06, "loss": 1.1481, "step": 20142 }, { "epoch": 0.61, "learning_rate": 1.7675585698648234e-06, "loss": 1.17, "step": 20143 }, { "epoch": 0.61, "learning_rate": 1.7673253566075226e-06, "loss": 1.0524, "step": 20144 }, { "epoch": 0.61, "learning_rate": 1.7670921503249319e-06, "loss": 1.0195, "step": 20145 }, { "epoch": 0.61, "learning_rate": 1.7668589510192707e-06, "loss": 1.0595, "step": 20146 }, { "epoch": 0.61, "learning_rate": 1.7666257586927592e-06, "loss": 1.119, "step": 20147 }, { "epoch": 0.61, "learning_rate": 1.7663925733476183e-06, "loss": 1.2543, "step": 20148 }, { "epoch": 0.61, "learning_rate": 1.7661593949860662e-06, "loss": 1.2253, "step": 20149 }, { "epoch": 0.61, "learning_rate": 1.7659262236103224e-06, "loss": 1.1647, "step": 20150 }, { "epoch": 0.61, "learning_rate": 1.7656930592226079e-06, "loss": 1.0472, "step": 20151 }, { "epoch": 0.61, "learning_rate": 1.7654599018251429e-06, "loss": 1.1239, "step": 20152 }, { "epoch": 0.61, "learning_rate": 1.7652267514201449e-06, "loss": 1.1552, "step": 20153 }, { "epoch": 0.61, "learning_rate": 1.764993608009834e-06, "loss": 1.1569, "step": 20154 }, { "epoch": 0.61, "learning_rate": 1.76476047159643e-06, "loss": 1.1062, "step": 20155 }, { "epoch": 0.61, "learning_rate": 1.764527342182153e-06, "loss": 1.1861, "step": 20156 }, { "epoch": 0.61, "learning_rate": 1.764294219769221e-06, "loss": 1.1324, "step": 20157 }, { "epoch": 0.61, "learning_rate": 1.7640611043598536e-06, "loss": 1.0588, "step": 20158 }, { "epoch": 0.61, "learning_rate": 1.7638279959562699e-06, "loss": 1.1172, "step": 20159 }, { "epoch": 0.61, "learning_rate": 1.763594894560689e-06, "loss": 0.9903, "step": 20160 }, { "epoch": 0.61, "learning_rate": 1.7633618001753314e-06, "loss": 1.2153, "step": 20161 }, { "epoch": 0.61, "learning_rate": 1.7631287128024134e-06, "loss": 1.079, "step": 20162 }, { "epoch": 0.61, "learning_rate": 1.7628956324441554e-06, "loss": 1.1052, "step": 20163 }, { "epoch": 0.61, "learning_rate": 1.7626625591027757e-06, "loss": 1.0496, "step": 20164 }, { "epoch": 0.61, "learning_rate": 1.7624294927804946e-06, "loss": 1.0941, "step": 20165 }, { "epoch": 0.61, "learning_rate": 1.7621964334795286e-06, "loss": 1.1921, "step": 20166 }, { "epoch": 0.61, "learning_rate": 1.761963381202097e-06, "loss": 1.1358, "step": 20167 }, { "epoch": 0.61, "learning_rate": 1.7617303359504184e-06, "loss": 1.0264, "step": 20168 }, { "epoch": 0.61, "learning_rate": 1.7614972977267122e-06, "loss": 1.0682, "step": 20169 }, { "epoch": 0.61, "learning_rate": 1.7612642665331955e-06, "loss": 1.1167, "step": 20170 }, { "epoch": 0.61, "learning_rate": 1.7610312423720872e-06, "loss": 1.1274, "step": 20171 }, { "epoch": 0.61, "learning_rate": 1.7607982252456056e-06, "loss": 1.0452, "step": 20172 }, { "epoch": 0.61, "learning_rate": 1.7605652151559689e-06, "loss": 1.1003, "step": 20173 }, { "epoch": 0.61, "learning_rate": 1.7603322121053962e-06, "loss": 1.046, "step": 20174 }, { "epoch": 0.61, "learning_rate": 1.7600992160961033e-06, "loss": 1.0183, "step": 20175 }, { "epoch": 0.61, "learning_rate": 1.75986622713031e-06, "loss": 1.1202, "step": 20176 }, { "epoch": 0.61, "learning_rate": 1.7596332452102332e-06, "loss": 1.0506, "step": 20177 }, { "epoch": 0.61, "learning_rate": 1.759400270338093e-06, "loss": 1.1081, "step": 20178 }, { "epoch": 0.61, "learning_rate": 1.7591673025161042e-06, "loss": 1.1375, "step": 20179 }, { "epoch": 0.61, "learning_rate": 1.7589343417464856e-06, "loss": 1.0924, "step": 20180 }, { "epoch": 0.61, "learning_rate": 1.7587013880314558e-06, "loss": 1.1103, "step": 20181 }, { "epoch": 0.61, "learning_rate": 1.7584684413732317e-06, "loss": 1.1449, "step": 20182 }, { "epoch": 0.61, "learning_rate": 1.7582355017740304e-06, "loss": 1.0456, "step": 20183 }, { "epoch": 0.61, "learning_rate": 1.7580025692360702e-06, "loss": 1.0999, "step": 20184 }, { "epoch": 0.61, "learning_rate": 1.7577696437615682e-06, "loss": 1.0911, "step": 20185 }, { "epoch": 0.61, "learning_rate": 1.7575367253527414e-06, "loss": 1.1414, "step": 20186 }, { "epoch": 0.61, "learning_rate": 1.7573038140118087e-06, "loss": 1.2897, "step": 20187 }, { "epoch": 0.61, "learning_rate": 1.757070909740985e-06, "loss": 1.107, "step": 20188 }, { "epoch": 0.61, "learning_rate": 1.7568380125424883e-06, "loss": 1.2739, "step": 20189 }, { "epoch": 0.61, "learning_rate": 1.7566051224185357e-06, "loss": 1.0771, "step": 20190 }, { "epoch": 0.61, "learning_rate": 1.7563722393713456e-06, "loss": 1.2247, "step": 20191 }, { "epoch": 0.61, "learning_rate": 1.7561393634031324e-06, "loss": 1.1463, "step": 20192 }, { "epoch": 0.61, "learning_rate": 1.7559064945161142e-06, "loss": 1.0013, "step": 20193 }, { "epoch": 0.61, "learning_rate": 1.7556736327125079e-06, "loss": 1.2675, "step": 20194 }, { "epoch": 0.61, "learning_rate": 1.7554407779945304e-06, "loss": 1.0573, "step": 20195 }, { "epoch": 0.61, "learning_rate": 1.755207930364398e-06, "loss": 1.0101, "step": 20196 }, { "epoch": 0.61, "learning_rate": 1.7549750898243273e-06, "loss": 1.1189, "step": 20197 }, { "epoch": 0.61, "learning_rate": 1.7547422563765346e-06, "loss": 1.1104, "step": 20198 }, { "epoch": 0.61, "learning_rate": 1.7545094300232373e-06, "loss": 1.1859, "step": 20199 }, { "epoch": 0.61, "learning_rate": 1.7542766107666514e-06, "loss": 1.0421, "step": 20200 }, { "epoch": 0.61, "learning_rate": 1.7540437986089925e-06, "loss": 1.1125, "step": 20201 }, { "epoch": 0.61, "learning_rate": 1.7538109935524772e-06, "loss": 1.0606, "step": 20202 }, { "epoch": 0.61, "learning_rate": 1.753578195599322e-06, "loss": 1.0841, "step": 20203 }, { "epoch": 0.61, "learning_rate": 1.753345404751744e-06, "loss": 0.9877, "step": 20204 }, { "epoch": 0.61, "learning_rate": 1.753112621011957e-06, "loss": 1.1541, "step": 20205 }, { "epoch": 0.61, "learning_rate": 1.7528798443821782e-06, "loss": 1.1722, "step": 20206 }, { "epoch": 0.61, "learning_rate": 1.7526470748646231e-06, "loss": 1.1609, "step": 20207 }, { "epoch": 0.61, "learning_rate": 1.7524143124615088e-06, "loss": 1.1108, "step": 20208 }, { "epoch": 0.61, "learning_rate": 1.7521815571750494e-06, "loss": 1.0745, "step": 20209 }, { "epoch": 0.61, "learning_rate": 1.7519488090074622e-06, "loss": 1.2244, "step": 20210 }, { "epoch": 0.61, "learning_rate": 1.7517160679609615e-06, "loss": 1.0923, "step": 20211 }, { "epoch": 0.61, "learning_rate": 1.7514833340377635e-06, "loss": 1.2546, "step": 20212 }, { "epoch": 0.61, "learning_rate": 1.751250607240084e-06, "loss": 1.134, "step": 20213 }, { "epoch": 0.61, "learning_rate": 1.7510178875701377e-06, "loss": 1.109, "step": 20214 }, { "epoch": 0.61, "learning_rate": 1.7507851750301401e-06, "loss": 1.1544, "step": 20215 }, { "epoch": 0.61, "learning_rate": 1.7505524696223071e-06, "loss": 1.1405, "step": 20216 }, { "epoch": 0.61, "learning_rate": 1.7503197713488548e-06, "loss": 1.2814, "step": 20217 }, { "epoch": 0.61, "learning_rate": 1.7500870802119962e-06, "loss": 1.0562, "step": 20218 }, { "epoch": 0.61, "learning_rate": 1.7498543962139469e-06, "loss": 1.0485, "step": 20219 }, { "epoch": 0.61, "learning_rate": 1.7496217193569232e-06, "loss": 1.1251, "step": 20220 }, { "epoch": 0.61, "learning_rate": 1.7493890496431397e-06, "loss": 1.195, "step": 20221 }, { "epoch": 0.61, "learning_rate": 1.7491563870748102e-06, "loss": 1.0358, "step": 20222 }, { "epoch": 0.61, "learning_rate": 1.74892373165415e-06, "loss": 1.0673, "step": 20223 }, { "epoch": 0.61, "learning_rate": 1.7486910833833748e-06, "loss": 1.1752, "step": 20224 }, { "epoch": 0.61, "learning_rate": 1.748458442264699e-06, "loss": 1.0399, "step": 20225 }, { "epoch": 0.61, "learning_rate": 1.748225808300336e-06, "loss": 1.1281, "step": 20226 }, { "epoch": 0.61, "learning_rate": 1.7479931814925011e-06, "loss": 1.2013, "step": 20227 }, { "epoch": 0.61, "learning_rate": 1.7477605618434093e-06, "loss": 1.1215, "step": 20228 }, { "epoch": 0.61, "learning_rate": 1.7475279493552747e-06, "loss": 1.1946, "step": 20229 }, { "epoch": 0.61, "learning_rate": 1.7472953440303126e-06, "loss": 1.0787, "step": 20230 }, { "epoch": 0.61, "learning_rate": 1.747062745870735e-06, "loss": 1.2128, "step": 20231 }, { "epoch": 0.61, "learning_rate": 1.7468301548787576e-06, "loss": 1.0733, "step": 20232 }, { "epoch": 0.61, "learning_rate": 1.7465975710565946e-06, "loss": 1.1057, "step": 20233 }, { "epoch": 0.61, "learning_rate": 1.7463649944064606e-06, "loss": 1.1359, "step": 20234 }, { "epoch": 0.61, "learning_rate": 1.7461324249305677e-06, "loss": 1.0006, "step": 20235 }, { "epoch": 0.61, "learning_rate": 1.7458998626311317e-06, "loss": 1.2484, "step": 20236 }, { "epoch": 0.61, "learning_rate": 1.7456673075103653e-06, "loss": 0.9534, "step": 20237 }, { "epoch": 0.61, "learning_rate": 1.7454347595704835e-06, "loss": 1.0474, "step": 20238 }, { "epoch": 0.61, "learning_rate": 1.7452022188136988e-06, "loss": 1.2321, "step": 20239 }, { "epoch": 0.61, "learning_rate": 1.7449696852422254e-06, "loss": 1.0316, "step": 20240 }, { "epoch": 0.61, "learning_rate": 1.7447371588582774e-06, "loss": 1.1091, "step": 20241 }, { "epoch": 0.61, "learning_rate": 1.7445046396640675e-06, "loss": 1.0366, "step": 20242 }, { "epoch": 0.61, "learning_rate": 1.7442721276618105e-06, "loss": 1.1499, "step": 20243 }, { "epoch": 0.61, "learning_rate": 1.7440396228537183e-06, "loss": 1.1652, "step": 20244 }, { "epoch": 0.61, "learning_rate": 1.7438071252420041e-06, "loss": 1.1909, "step": 20245 }, { "epoch": 0.61, "learning_rate": 1.7435746348288823e-06, "loss": 1.0298, "step": 20246 }, { "epoch": 0.61, "learning_rate": 1.743342151616567e-06, "loss": 1.0809, "step": 20247 }, { "epoch": 0.61, "learning_rate": 1.7431096756072686e-06, "loss": 1.1656, "step": 20248 }, { "epoch": 0.61, "learning_rate": 1.7428772068032015e-06, "loss": 1.1534, "step": 20249 }, { "epoch": 0.61, "learning_rate": 1.7426447452065787e-06, "loss": 1.1778, "step": 20250 }, { "epoch": 0.61, "learning_rate": 1.742412290819614e-06, "loss": 1.1065, "step": 20251 }, { "epoch": 0.61, "learning_rate": 1.7421798436445187e-06, "loss": 1.2784, "step": 20252 }, { "epoch": 0.61, "learning_rate": 1.7419474036835066e-06, "loss": 1.1086, "step": 20253 }, { "epoch": 0.61, "learning_rate": 1.7417149709387898e-06, "loss": 1.1354, "step": 20254 }, { "epoch": 0.61, "learning_rate": 1.7414825454125811e-06, "loss": 1.1271, "step": 20255 }, { "epoch": 0.61, "learning_rate": 1.7412501271070948e-06, "loss": 1.2703, "step": 20256 }, { "epoch": 0.61, "learning_rate": 1.7410177160245407e-06, "loss": 1.072, "step": 20257 }, { "epoch": 0.61, "learning_rate": 1.7407853121671319e-06, "loss": 1.0333, "step": 20258 }, { "epoch": 0.61, "learning_rate": 1.740552915537082e-06, "loss": 1.0751, "step": 20259 }, { "epoch": 0.61, "learning_rate": 1.740320526136603e-06, "loss": 1.1567, "step": 20260 }, { "epoch": 0.61, "learning_rate": 1.7400881439679062e-06, "loss": 1.1755, "step": 20261 }, { "epoch": 0.61, "learning_rate": 1.7398557690332041e-06, "loss": 1.1356, "step": 20262 }, { "epoch": 0.61, "learning_rate": 1.7396234013347088e-06, "loss": 1.0747, "step": 20263 }, { "epoch": 0.61, "learning_rate": 1.739391040874633e-06, "loss": 1.0604, "step": 20264 }, { "epoch": 0.61, "learning_rate": 1.739158687655188e-06, "loss": 1.0441, "step": 20265 }, { "epoch": 0.61, "learning_rate": 1.7389263416785856e-06, "loss": 1.0993, "step": 20266 }, { "epoch": 0.61, "learning_rate": 1.738694002947038e-06, "loss": 1.0006, "step": 20267 }, { "epoch": 0.61, "learning_rate": 1.7384616714627567e-06, "loss": 1.1021, "step": 20268 }, { "epoch": 0.61, "learning_rate": 1.7382293472279545e-06, "loss": 1.0762, "step": 20269 }, { "epoch": 0.61, "learning_rate": 1.7379970302448412e-06, "loss": 1.0817, "step": 20270 }, { "epoch": 0.61, "learning_rate": 1.7377647205156292e-06, "loss": 1.0563, "step": 20271 }, { "epoch": 0.61, "learning_rate": 1.73753241804253e-06, "loss": 1.0995, "step": 20272 }, { "epoch": 0.61, "learning_rate": 1.7373001228277558e-06, "loss": 1.2306, "step": 20273 }, { "epoch": 0.61, "learning_rate": 1.737067834873516e-06, "loss": 1.2653, "step": 20274 }, { "epoch": 0.61, "learning_rate": 1.7368355541820232e-06, "loss": 1.0119, "step": 20275 }, { "epoch": 0.61, "learning_rate": 1.7366032807554884e-06, "loss": 1.1311, "step": 20276 }, { "epoch": 0.61, "learning_rate": 1.736371014596123e-06, "loss": 1.1301, "step": 20277 }, { "epoch": 0.61, "learning_rate": 1.7361387557061371e-06, "loss": 1.0955, "step": 20278 }, { "epoch": 0.61, "learning_rate": 1.7359065040877427e-06, "loss": 1.1589, "step": 20279 }, { "epoch": 0.61, "learning_rate": 1.7356742597431504e-06, "loss": 1.2642, "step": 20280 }, { "epoch": 0.61, "learning_rate": 1.7354420226745714e-06, "loss": 1.1, "step": 20281 }, { "epoch": 0.61, "learning_rate": 1.735209792884216e-06, "loss": 1.1569, "step": 20282 }, { "epoch": 0.61, "learning_rate": 1.734977570374295e-06, "loss": 1.0859, "step": 20283 }, { "epoch": 0.61, "learning_rate": 1.7347453551470186e-06, "loss": 1.112, "step": 20284 }, { "epoch": 0.61, "learning_rate": 1.7345131472045979e-06, "loss": 1.158, "step": 20285 }, { "epoch": 0.61, "learning_rate": 1.7342809465492447e-06, "loss": 1.1807, "step": 20286 }, { "epoch": 0.61, "learning_rate": 1.7340487531831668e-06, "loss": 1.1459, "step": 20287 }, { "epoch": 0.61, "learning_rate": 1.733816567108576e-06, "loss": 1.0859, "step": 20288 }, { "epoch": 0.61, "learning_rate": 1.7335843883276827e-06, "loss": 1.2144, "step": 20289 }, { "epoch": 0.61, "learning_rate": 1.7333522168426969e-06, "loss": 1.0435, "step": 20290 }, { "epoch": 0.61, "learning_rate": 1.7331200526558285e-06, "loss": 1.0164, "step": 20291 }, { "epoch": 0.61, "learning_rate": 1.7328878957692884e-06, "loss": 1.1898, "step": 20292 }, { "epoch": 0.61, "learning_rate": 1.7326557461852856e-06, "loss": 1.123, "step": 20293 }, { "epoch": 0.61, "learning_rate": 1.7324236039060306e-06, "loss": 1.1381, "step": 20294 }, { "epoch": 0.61, "learning_rate": 1.7321914689337332e-06, "loss": 1.1229, "step": 20295 }, { "epoch": 0.61, "learning_rate": 1.7319593412706032e-06, "loss": 1.1104, "step": 20296 }, { "epoch": 0.61, "learning_rate": 1.7317272209188505e-06, "loss": 1.1221, "step": 20297 }, { "epoch": 0.61, "learning_rate": 1.731495107880684e-06, "loss": 1.1022, "step": 20298 }, { "epoch": 0.61, "learning_rate": 1.7312630021583156e-06, "loss": 1.1568, "step": 20299 }, { "epoch": 0.61, "learning_rate": 1.7310309037539519e-06, "loss": 0.9467, "step": 20300 }, { "epoch": 0.61, "learning_rate": 1.730798812669804e-06, "loss": 1.1472, "step": 20301 }, { "epoch": 0.61, "learning_rate": 1.7305667289080805e-06, "loss": 1.0687, "step": 20302 }, { "epoch": 0.61, "learning_rate": 1.7303346524709924e-06, "loss": 1.069, "step": 20303 }, { "epoch": 0.61, "learning_rate": 1.7301025833607466e-06, "loss": 1.0685, "step": 20304 }, { "epoch": 0.61, "learning_rate": 1.7298705215795535e-06, "loss": 1.1619, "step": 20305 }, { "epoch": 0.61, "learning_rate": 1.7296384671296221e-06, "loss": 1.1852, "step": 20306 }, { "epoch": 0.61, "learning_rate": 1.7294064200131615e-06, "loss": 1.1224, "step": 20307 }, { "epoch": 0.61, "learning_rate": 1.729174380232381e-06, "loss": 1.2053, "step": 20308 }, { "epoch": 0.61, "learning_rate": 1.728942347789489e-06, "loss": 1.207, "step": 20309 }, { "epoch": 0.61, "learning_rate": 1.728710322686694e-06, "loss": 1.2074, "step": 20310 }, { "epoch": 0.61, "learning_rate": 1.7284783049262055e-06, "loss": 1.0844, "step": 20311 }, { "epoch": 0.61, "learning_rate": 1.728246294510233e-06, "loss": 1.0509, "step": 20312 }, { "epoch": 0.61, "learning_rate": 1.728014291440983e-06, "loss": 1.0944, "step": 20313 }, { "epoch": 0.61, "learning_rate": 1.7277822957206652e-06, "loss": 1.1445, "step": 20314 }, { "epoch": 0.61, "learning_rate": 1.7275503073514882e-06, "loss": 1.1318, "step": 20315 }, { "epoch": 0.61, "learning_rate": 1.7273183263356613e-06, "loss": 1.0712, "step": 20316 }, { "epoch": 0.61, "learning_rate": 1.7270863526753906e-06, "loss": 1.3031, "step": 20317 }, { "epoch": 0.61, "learning_rate": 1.7268543863728854e-06, "loss": 1.0551, "step": 20318 }, { "epoch": 0.61, "learning_rate": 1.7266224274303544e-06, "loss": 1.0959, "step": 20319 }, { "epoch": 0.61, "learning_rate": 1.726390475850005e-06, "loss": 1.11, "step": 20320 }, { "epoch": 0.61, "learning_rate": 1.7261585316340468e-06, "loss": 1.2643, "step": 20321 }, { "epoch": 0.61, "learning_rate": 1.7259265947846856e-06, "loss": 1.0574, "step": 20322 }, { "epoch": 0.61, "learning_rate": 1.7256946653041306e-06, "loss": 1.2032, "step": 20323 }, { "epoch": 0.61, "learning_rate": 1.7254627431945898e-06, "loss": 1.1876, "step": 20324 }, { "epoch": 0.61, "learning_rate": 1.7252308284582713e-06, "loss": 1.1813, "step": 20325 }, { "epoch": 0.61, "learning_rate": 1.724998921097381e-06, "loss": 1.0862, "step": 20326 }, { "epoch": 0.61, "learning_rate": 1.7247670211141283e-06, "loss": 1.124, "step": 20327 }, { "epoch": 0.61, "learning_rate": 1.7245351285107197e-06, "loss": 1.0413, "step": 20328 }, { "epoch": 0.61, "learning_rate": 1.7243032432893644e-06, "loss": 1.1553, "step": 20329 }, { "epoch": 0.61, "learning_rate": 1.7240713654522675e-06, "loss": 1.0948, "step": 20330 }, { "epoch": 0.61, "learning_rate": 1.7238394950016377e-06, "loss": 1.3054, "step": 20331 }, { "epoch": 0.61, "learning_rate": 1.723607631939682e-06, "loss": 1.1418, "step": 20332 }, { "epoch": 0.61, "learning_rate": 1.7233757762686076e-06, "loss": 1.0972, "step": 20333 }, { "epoch": 0.61, "learning_rate": 1.7231439279906227e-06, "loss": 1.0348, "step": 20334 }, { "epoch": 0.61, "learning_rate": 1.7229120871079325e-06, "loss": 1.1414, "step": 20335 }, { "epoch": 0.61, "learning_rate": 1.7226802536227449e-06, "loss": 1.0862, "step": 20336 }, { "epoch": 0.61, "learning_rate": 1.722448427537267e-06, "loss": 1.1132, "step": 20337 }, { "epoch": 0.61, "learning_rate": 1.722216608853707e-06, "loss": 1.0273, "step": 20338 }, { "epoch": 0.61, "learning_rate": 1.721984797574269e-06, "loss": 1.0498, "step": 20339 }, { "epoch": 0.61, "learning_rate": 1.7217529937011612e-06, "loss": 1.1033, "step": 20340 }, { "epoch": 0.61, "learning_rate": 1.7215211972365897e-06, "loss": 1.1017, "step": 20341 }, { "epoch": 0.61, "learning_rate": 1.7212894081827627e-06, "loss": 1.1797, "step": 20342 }, { "epoch": 0.61, "learning_rate": 1.7210576265418846e-06, "loss": 1.2015, "step": 20343 }, { "epoch": 0.61, "learning_rate": 1.7208258523161625e-06, "loss": 1.1046, "step": 20344 }, { "epoch": 0.61, "learning_rate": 1.7205940855078032e-06, "loss": 1.1667, "step": 20345 }, { "epoch": 0.61, "learning_rate": 1.7203623261190128e-06, "loss": 1.1823, "step": 20346 }, { "epoch": 0.61, "learning_rate": 1.720130574151998e-06, "loss": 1.248, "step": 20347 }, { "epoch": 0.61, "learning_rate": 1.719898829608964e-06, "loss": 1.0759, "step": 20348 }, { "epoch": 0.61, "learning_rate": 1.7196670924921178e-06, "loss": 1.1426, "step": 20349 }, { "epoch": 0.61, "learning_rate": 1.7194353628036648e-06, "loss": 1.1287, "step": 20350 }, { "epoch": 0.61, "learning_rate": 1.719203640545812e-06, "loss": 1.2123, "step": 20351 }, { "epoch": 0.61, "learning_rate": 1.7189719257207637e-06, "loss": 1.1437, "step": 20352 }, { "epoch": 0.61, "learning_rate": 1.7187402183307267e-06, "loss": 1.1059, "step": 20353 }, { "epoch": 0.61, "learning_rate": 1.7185085183779062e-06, "loss": 1.1215, "step": 20354 }, { "epoch": 0.61, "learning_rate": 1.7182768258645094e-06, "loss": 1.0715, "step": 20355 }, { "epoch": 0.61, "learning_rate": 1.7180451407927398e-06, "loss": 1.2017, "step": 20356 }, { "epoch": 0.61, "learning_rate": 1.7178134631648035e-06, "loss": 1.0624, "step": 20357 }, { "epoch": 0.61, "learning_rate": 1.7175817929829069e-06, "loss": 1.1011, "step": 20358 }, { "epoch": 0.61, "learning_rate": 1.7173501302492545e-06, "loss": 1.0983, "step": 20359 }, { "epoch": 0.61, "learning_rate": 1.7171184749660524e-06, "loss": 1.0333, "step": 20360 }, { "epoch": 0.61, "learning_rate": 1.716886827135505e-06, "loss": 1.1681, "step": 20361 }, { "epoch": 0.61, "learning_rate": 1.7166551867598174e-06, "loss": 1.2614, "step": 20362 }, { "epoch": 0.61, "learning_rate": 1.7164235538411956e-06, "loss": 1.1542, "step": 20363 }, { "epoch": 0.61, "learning_rate": 1.7161919283818451e-06, "loss": 0.9973, "step": 20364 }, { "epoch": 0.61, "learning_rate": 1.715960310383969e-06, "loss": 1.0278, "step": 20365 }, { "epoch": 0.61, "learning_rate": 1.715728699849773e-06, "loss": 1.035, "step": 20366 }, { "epoch": 0.61, "learning_rate": 1.7154970967814622e-06, "loss": 1.1454, "step": 20367 }, { "epoch": 0.61, "learning_rate": 1.715265501181242e-06, "loss": 1.1696, "step": 20368 }, { "epoch": 0.61, "learning_rate": 1.7150339130513156e-06, "loss": 1.159, "step": 20369 }, { "epoch": 0.61, "learning_rate": 1.7148023323938878e-06, "loss": 1.0424, "step": 20370 }, { "epoch": 0.61, "learning_rate": 1.7145707592111638e-06, "loss": 1.094, "step": 20371 }, { "epoch": 0.61, "learning_rate": 1.7143391935053483e-06, "loss": 1.0916, "step": 20372 }, { "epoch": 0.61, "learning_rate": 1.7141076352786453e-06, "loss": 1.039, "step": 20373 }, { "epoch": 0.61, "learning_rate": 1.7138760845332588e-06, "loss": 1.0764, "step": 20374 }, { "epoch": 0.61, "learning_rate": 1.7136445412713943e-06, "loss": 1.1531, "step": 20375 }, { "epoch": 0.61, "learning_rate": 1.7134130054952538e-06, "loss": 1.0704, "step": 20376 }, { "epoch": 0.61, "learning_rate": 1.7131814772070437e-06, "loss": 1.2103, "step": 20377 }, { "epoch": 0.61, "learning_rate": 1.7129499564089662e-06, "loss": 1.2084, "step": 20378 }, { "epoch": 0.61, "learning_rate": 1.7127184431032262e-06, "loss": 1.1597, "step": 20379 }, { "epoch": 0.61, "learning_rate": 1.7124869372920272e-06, "loss": 1.0678, "step": 20380 }, { "epoch": 0.61, "learning_rate": 1.7122554389775747e-06, "loss": 1.0387, "step": 20381 }, { "epoch": 0.61, "learning_rate": 1.71202394816207e-06, "loss": 1.0276, "step": 20382 }, { "epoch": 0.61, "learning_rate": 1.7117924648477174e-06, "loss": 1.1099, "step": 20383 }, { "epoch": 0.61, "learning_rate": 1.711560989036721e-06, "loss": 1.1646, "step": 20384 }, { "epoch": 0.61, "learning_rate": 1.7113295207312844e-06, "loss": 1.129, "step": 20385 }, { "epoch": 0.61, "learning_rate": 1.7110980599336119e-06, "loss": 1.2493, "step": 20386 }, { "epoch": 0.61, "learning_rate": 1.7108666066459052e-06, "loss": 1.1077, "step": 20387 }, { "epoch": 0.61, "learning_rate": 1.7106351608703681e-06, "loss": 1.0812, "step": 20388 }, { "epoch": 0.61, "learning_rate": 1.710403722609204e-06, "loss": 1.0593, "step": 20389 }, { "epoch": 0.61, "learning_rate": 1.7101722918646168e-06, "loss": 1.1075, "step": 20390 }, { "epoch": 0.61, "learning_rate": 1.7099408686388083e-06, "loss": 1.1764, "step": 20391 }, { "epoch": 0.61, "learning_rate": 1.7097094529339825e-06, "loss": 1.1014, "step": 20392 }, { "epoch": 0.61, "learning_rate": 1.7094780447523417e-06, "loss": 1.1923, "step": 20393 }, { "epoch": 0.61, "learning_rate": 1.709246644096091e-06, "loss": 1.1036, "step": 20394 }, { "epoch": 0.61, "learning_rate": 1.7090152509674297e-06, "loss": 1.1027, "step": 20395 }, { "epoch": 0.61, "learning_rate": 1.7087838653685623e-06, "loss": 1.1488, "step": 20396 }, { "epoch": 0.61, "learning_rate": 1.7085524873016915e-06, "loss": 0.981, "step": 20397 }, { "epoch": 0.61, "learning_rate": 1.7083211167690201e-06, "loss": 1.0996, "step": 20398 }, { "epoch": 0.61, "learning_rate": 1.708089753772751e-06, "loss": 1.118, "step": 20399 }, { "epoch": 0.61, "learning_rate": 1.7078583983150853e-06, "loss": 1.3065, "step": 20400 }, { "epoch": 0.61, "learning_rate": 1.7076270503982262e-06, "loss": 1.1934, "step": 20401 }, { "epoch": 0.61, "learning_rate": 1.7073957100243758e-06, "loss": 1.0828, "step": 20402 }, { "epoch": 0.61, "learning_rate": 1.7071643771957368e-06, "loss": 1.0986, "step": 20403 }, { "epoch": 0.61, "learning_rate": 1.706933051914511e-06, "loss": 1.1548, "step": 20404 }, { "epoch": 0.61, "learning_rate": 1.7067017341829003e-06, "loss": 1.1533, "step": 20405 }, { "epoch": 0.61, "learning_rate": 1.706470424003107e-06, "loss": 1.3866, "step": 20406 }, { "epoch": 0.61, "learning_rate": 1.7062391213773343e-06, "loss": 1.0438, "step": 20407 }, { "epoch": 0.61, "learning_rate": 1.706007826307782e-06, "loss": 1.063, "step": 20408 }, { "epoch": 0.61, "learning_rate": 1.7057765387966528e-06, "loss": 1.1021, "step": 20409 }, { "epoch": 0.61, "learning_rate": 1.7055452588461479e-06, "loss": 1.1143, "step": 20410 }, { "epoch": 0.61, "learning_rate": 1.7053139864584711e-06, "loss": 1.0845, "step": 20411 }, { "epoch": 0.61, "learning_rate": 1.7050827216358211e-06, "loss": 1.2781, "step": 20412 }, { "epoch": 0.61, "learning_rate": 1.704851464380401e-06, "loss": 1.0727, "step": 20413 }, { "epoch": 0.61, "learning_rate": 1.7046202146944116e-06, "loss": 1.0361, "step": 20414 }, { "epoch": 0.62, "learning_rate": 1.7043889725800549e-06, "loss": 1.0052, "step": 20415 }, { "epoch": 0.62, "learning_rate": 1.7041577380395324e-06, "loss": 1.0577, "step": 20416 }, { "epoch": 0.62, "learning_rate": 1.7039265110750446e-06, "loss": 1.1254, "step": 20417 }, { "epoch": 0.62, "learning_rate": 1.703695291688793e-06, "loss": 1.0786, "step": 20418 }, { "epoch": 0.62, "learning_rate": 1.7034640798829788e-06, "loss": 1.0232, "step": 20419 }, { "epoch": 0.62, "learning_rate": 1.7032328756598037e-06, "loss": 1.0247, "step": 20420 }, { "epoch": 0.62, "learning_rate": 1.703001679021467e-06, "loss": 1.0344, "step": 20421 }, { "epoch": 0.62, "learning_rate": 1.7027704899701706e-06, "loss": 1.0483, "step": 20422 }, { "epoch": 0.62, "learning_rate": 1.7025393085081148e-06, "loss": 1.1572, "step": 20423 }, { "epoch": 0.62, "learning_rate": 1.702308134637502e-06, "loss": 1.1984, "step": 20424 }, { "epoch": 0.62, "learning_rate": 1.7020769683605308e-06, "loss": 1.1572, "step": 20425 }, { "epoch": 0.62, "learning_rate": 1.7018458096794022e-06, "loss": 1.104, "step": 20426 }, { "epoch": 0.62, "learning_rate": 1.7016146585963173e-06, "loss": 1.1666, "step": 20427 }, { "epoch": 0.62, "learning_rate": 1.701383515113476e-06, "loss": 1.154, "step": 20428 }, { "epoch": 0.62, "learning_rate": 1.7011523792330798e-06, "loss": 1.008, "step": 20429 }, { "epoch": 0.62, "learning_rate": 1.7009212509573275e-06, "loss": 1.1021, "step": 20430 }, { "epoch": 0.62, "learning_rate": 1.7006901302884205e-06, "loss": 1.0676, "step": 20431 }, { "epoch": 0.62, "learning_rate": 1.7004590172285578e-06, "loss": 1.0624, "step": 20432 }, { "epoch": 0.62, "learning_rate": 1.700227911779942e-06, "loss": 1.2388, "step": 20433 }, { "epoch": 0.62, "learning_rate": 1.6999968139447698e-06, "loss": 1.1608, "step": 20434 }, { "epoch": 0.62, "learning_rate": 1.6997657237252424e-06, "loss": 1.1814, "step": 20435 }, { "epoch": 0.62, "learning_rate": 1.6995346411235603e-06, "loss": 1.1113, "step": 20436 }, { "epoch": 0.62, "learning_rate": 1.6993035661419238e-06, "loss": 1.1113, "step": 20437 }, { "epoch": 0.62, "learning_rate": 1.6990724987825307e-06, "loss": 1.1016, "step": 20438 }, { "epoch": 0.62, "learning_rate": 1.6988414390475819e-06, "loss": 1.1586, "step": 20439 }, { "epoch": 0.62, "learning_rate": 1.6986103869392764e-06, "loss": 1.058, "step": 20440 }, { "epoch": 0.62, "learning_rate": 1.6983793424598143e-06, "loss": 1.0963, "step": 20441 }, { "epoch": 0.62, "learning_rate": 1.698148305611395e-06, "loss": 1.1208, "step": 20442 }, { "epoch": 0.62, "learning_rate": 1.6979172763962175e-06, "loss": 1.2195, "step": 20443 }, { "epoch": 0.62, "learning_rate": 1.697686254816481e-06, "loss": 1.1544, "step": 20444 }, { "epoch": 0.62, "learning_rate": 1.697455240874385e-06, "loss": 1.0601, "step": 20445 }, { "epoch": 0.62, "learning_rate": 1.6972242345721295e-06, "loss": 1.1862, "step": 20446 }, { "epoch": 0.62, "learning_rate": 1.6969932359119118e-06, "loss": 1.1526, "step": 20447 }, { "epoch": 0.62, "learning_rate": 1.696762244895932e-06, "loss": 1.1654, "step": 20448 }, { "epoch": 0.62, "learning_rate": 1.6965312615263884e-06, "loss": 1.0229, "step": 20449 }, { "epoch": 0.62, "learning_rate": 1.6963002858054812e-06, "loss": 1.1012, "step": 20450 }, { "epoch": 0.62, "learning_rate": 1.6960693177354073e-06, "loss": 1.1776, "step": 20451 }, { "epoch": 0.62, "learning_rate": 1.6958383573183663e-06, "loss": 1.115, "step": 20452 }, { "epoch": 0.62, "learning_rate": 1.6956074045565568e-06, "loss": 1.161, "step": 20453 }, { "epoch": 0.62, "learning_rate": 1.6953764594521777e-06, "loss": 1.1755, "step": 20454 }, { "epoch": 0.62, "learning_rate": 1.6951455220074275e-06, "loss": 1.1993, "step": 20455 }, { "epoch": 0.62, "learning_rate": 1.6949145922245036e-06, "loss": 1.1143, "step": 20456 }, { "epoch": 0.62, "learning_rate": 1.6946836701056058e-06, "loss": 1.1473, "step": 20457 }, { "epoch": 0.62, "learning_rate": 1.6944527556529312e-06, "loss": 1.1415, "step": 20458 }, { "epoch": 0.62, "learning_rate": 1.6942218488686785e-06, "loss": 1.1984, "step": 20459 }, { "epoch": 0.62, "learning_rate": 1.6939909497550455e-06, "loss": 1.1697, "step": 20460 }, { "epoch": 0.62, "learning_rate": 1.6937600583142303e-06, "loss": 1.1544, "step": 20461 }, { "epoch": 0.62, "learning_rate": 1.693529174548431e-06, "loss": 1.0541, "step": 20462 }, { "epoch": 0.62, "learning_rate": 1.6932982984598467e-06, "loss": 1.1233, "step": 20463 }, { "epoch": 0.62, "learning_rate": 1.6930674300506733e-06, "loss": 1.17, "step": 20464 }, { "epoch": 0.62, "learning_rate": 1.692836569323109e-06, "loss": 1.1216, "step": 20465 }, { "epoch": 0.62, "learning_rate": 1.692605716279352e-06, "loss": 1.1564, "step": 20466 }, { "epoch": 0.62, "learning_rate": 1.6923748709215996e-06, "loss": 1.1007, "step": 20467 }, { "epoch": 0.62, "learning_rate": 1.6921440332520506e-06, "loss": 1.109, "step": 20468 }, { "epoch": 0.62, "learning_rate": 1.6919132032729002e-06, "loss": 1.0897, "step": 20469 }, { "epoch": 0.62, "learning_rate": 1.6916823809863469e-06, "loss": 1.1644, "step": 20470 }, { "epoch": 0.62, "learning_rate": 1.691451566394588e-06, "loss": 1.0249, "step": 20471 }, { "epoch": 0.62, "learning_rate": 1.6912207594998215e-06, "loss": 1.0345, "step": 20472 }, { "epoch": 0.62, "learning_rate": 1.6909899603042428e-06, "loss": 1.1662, "step": 20473 }, { "epoch": 0.62, "learning_rate": 1.6907591688100505e-06, "loss": 1.1042, "step": 20474 }, { "epoch": 0.62, "learning_rate": 1.6905283850194414e-06, "loss": 1.0588, "step": 20475 }, { "epoch": 0.62, "learning_rate": 1.690297608934613e-06, "loss": 1.1536, "step": 20476 }, { "epoch": 0.62, "learning_rate": 1.6900668405577603e-06, "loss": 1.0732, "step": 20477 }, { "epoch": 0.62, "learning_rate": 1.6898360798910812e-06, "loss": 1.0789, "step": 20478 }, { "epoch": 0.62, "learning_rate": 1.6896053269367724e-06, "loss": 1.2347, "step": 20479 }, { "epoch": 0.62, "learning_rate": 1.689374581697031e-06, "loss": 1.2316, "step": 20480 }, { "epoch": 0.62, "learning_rate": 1.6891438441740537e-06, "loss": 1.036, "step": 20481 }, { "epoch": 0.62, "learning_rate": 1.6889131143700354e-06, "loss": 1.1569, "step": 20482 }, { "epoch": 0.62, "learning_rate": 1.6886823922871737e-06, "loss": 1.1392, "step": 20483 }, { "epoch": 0.62, "learning_rate": 1.6884516779276651e-06, "loss": 1.1107, "step": 20484 }, { "epoch": 0.62, "learning_rate": 1.688220971293706e-06, "loss": 1.0583, "step": 20485 }, { "epoch": 0.62, "learning_rate": 1.687990272387492e-06, "loss": 1.1496, "step": 20486 }, { "epoch": 0.62, "learning_rate": 1.6877595812112197e-06, "loss": 1.171, "step": 20487 }, { "epoch": 0.62, "learning_rate": 1.6875288977670845e-06, "loss": 1.2709, "step": 20488 }, { "epoch": 0.62, "learning_rate": 1.6872982220572842e-06, "loss": 1.0862, "step": 20489 }, { "epoch": 0.62, "learning_rate": 1.687067554084012e-06, "loss": 1.0618, "step": 20490 }, { "epoch": 0.62, "learning_rate": 1.6868368938494656e-06, "loss": 1.1508, "step": 20491 }, { "epoch": 0.62, "learning_rate": 1.6866062413558404e-06, "loss": 1.1927, "step": 20492 }, { "epoch": 0.62, "learning_rate": 1.6863755966053315e-06, "loss": 1.1035, "step": 20493 }, { "epoch": 0.62, "learning_rate": 1.6861449596001368e-06, "loss": 1.0994, "step": 20494 }, { "epoch": 0.62, "learning_rate": 1.6859143303424486e-06, "loss": 1.1191, "step": 20495 }, { "epoch": 0.62, "learning_rate": 1.685683708834464e-06, "loss": 1.0157, "step": 20496 }, { "epoch": 0.62, "learning_rate": 1.685453095078378e-06, "loss": 1.1529, "step": 20497 }, { "epoch": 0.62, "learning_rate": 1.6852224890763875e-06, "loss": 1.1559, "step": 20498 }, { "epoch": 0.62, "learning_rate": 1.6849918908306856e-06, "loss": 1.0327, "step": 20499 }, { "epoch": 0.62, "learning_rate": 1.6847613003434682e-06, "loss": 1.0403, "step": 20500 }, { "epoch": 0.62, "learning_rate": 1.6845307176169306e-06, "loss": 1.0503, "step": 20501 }, { "epoch": 0.62, "learning_rate": 1.684300142653269e-06, "loss": 1.0583, "step": 20502 }, { "epoch": 0.62, "learning_rate": 1.6840695754546762e-06, "loss": 1.1115, "step": 20503 }, { "epoch": 0.62, "learning_rate": 1.6838390160233482e-06, "loss": 1.1606, "step": 20504 }, { "epoch": 0.62, "learning_rate": 1.6836084643614792e-06, "loss": 1.0912, "step": 20505 }, { "epoch": 0.62, "learning_rate": 1.6833779204712648e-06, "loss": 1.1819, "step": 20506 }, { "epoch": 0.62, "learning_rate": 1.6831473843549004e-06, "loss": 1.1701, "step": 20507 }, { "epoch": 0.62, "learning_rate": 1.682916856014578e-06, "loss": 1.1086, "step": 20508 }, { "epoch": 0.62, "learning_rate": 1.6826863354524942e-06, "loss": 1.0965, "step": 20509 }, { "epoch": 0.62, "learning_rate": 1.6824558226708427e-06, "loss": 1.1295, "step": 20510 }, { "epoch": 0.62, "learning_rate": 1.6822253176718185e-06, "loss": 1.1428, "step": 20511 }, { "epoch": 0.62, "learning_rate": 1.6819948204576148e-06, "loss": 1.1672, "step": 20512 }, { "epoch": 0.62, "learning_rate": 1.6817643310304263e-06, "loss": 1.2443, "step": 20513 }, { "epoch": 0.62, "learning_rate": 1.6815338493924477e-06, "loss": 1.1054, "step": 20514 }, { "epoch": 0.62, "learning_rate": 1.6813033755458733e-06, "loss": 1.1649, "step": 20515 }, { "epoch": 0.62, "learning_rate": 1.6810729094928956e-06, "loss": 1.0629, "step": 20516 }, { "epoch": 0.62, "learning_rate": 1.6808424512357094e-06, "loss": 1.084, "step": 20517 }, { "epoch": 0.62, "learning_rate": 1.6806120007765087e-06, "loss": 1.0858, "step": 20518 }, { "epoch": 0.62, "learning_rate": 1.6803815581174867e-06, "loss": 1.0759, "step": 20519 }, { "epoch": 0.62, "learning_rate": 1.680151123260839e-06, "loss": 1.1282, "step": 20520 }, { "epoch": 0.62, "learning_rate": 1.6799206962087567e-06, "loss": 1.0757, "step": 20521 }, { "epoch": 0.62, "learning_rate": 1.679690276963434e-06, "loss": 1.1407, "step": 20522 }, { "epoch": 0.62, "learning_rate": 1.679459865527065e-06, "loss": 1.0677, "step": 20523 }, { "epoch": 0.62, "learning_rate": 1.6792294619018434e-06, "loss": 1.2825, "step": 20524 }, { "epoch": 0.62, "learning_rate": 1.6789990660899616e-06, "loss": 1.0065, "step": 20525 }, { "epoch": 0.62, "learning_rate": 1.6787686780936132e-06, "loss": 1.1272, "step": 20526 }, { "epoch": 0.62, "learning_rate": 1.6785382979149917e-06, "loss": 1.1388, "step": 20527 }, { "epoch": 0.62, "learning_rate": 1.6783079255562907e-06, "loss": 1.1566, "step": 20528 }, { "epoch": 0.62, "learning_rate": 1.6780775610197017e-06, "loss": 1.1521, "step": 20529 }, { "epoch": 0.62, "learning_rate": 1.6778472043074185e-06, "loss": 1.1672, "step": 20530 }, { "epoch": 0.62, "learning_rate": 1.6776168554216338e-06, "loss": 1.0753, "step": 20531 }, { "epoch": 0.62, "learning_rate": 1.6773865143645403e-06, "loss": 1.0811, "step": 20532 }, { "epoch": 0.62, "learning_rate": 1.6771561811383325e-06, "loss": 1.0716, "step": 20533 }, { "epoch": 0.62, "learning_rate": 1.6769258557452e-06, "loss": 1.0538, "step": 20534 }, { "epoch": 0.62, "learning_rate": 1.6766955381873373e-06, "loss": 1.1553, "step": 20535 }, { "epoch": 0.62, "learning_rate": 1.676465228466937e-06, "loss": 1.1518, "step": 20536 }, { "epoch": 0.62, "learning_rate": 1.676234926586191e-06, "loss": 1.1971, "step": 20537 }, { "epoch": 0.62, "learning_rate": 1.6760046325472913e-06, "loss": 1.1445, "step": 20538 }, { "epoch": 0.62, "learning_rate": 1.6757743463524312e-06, "loss": 1.1918, "step": 20539 }, { "epoch": 0.62, "learning_rate": 1.6755440680038022e-06, "loss": 1.1251, "step": 20540 }, { "epoch": 0.62, "learning_rate": 1.6753137975035965e-06, "loss": 1.2048, "step": 20541 }, { "epoch": 0.62, "learning_rate": 1.6750835348540062e-06, "loss": 1.098, "step": 20542 }, { "epoch": 0.62, "learning_rate": 1.6748532800572232e-06, "loss": 1.2518, "step": 20543 }, { "epoch": 0.62, "learning_rate": 1.6746230331154394e-06, "loss": 1.3361, "step": 20544 }, { "epoch": 0.62, "learning_rate": 1.6743927940308474e-06, "loss": 1.1293, "step": 20545 }, { "epoch": 0.62, "learning_rate": 1.674162562805639e-06, "loss": 1.0649, "step": 20546 }, { "epoch": 0.62, "learning_rate": 1.6739323394420043e-06, "loss": 1.146, "step": 20547 }, { "epoch": 0.62, "learning_rate": 1.6737021239421358e-06, "loss": 1.2328, "step": 20548 }, { "epoch": 0.62, "learning_rate": 1.673471916308225e-06, "loss": 1.105, "step": 20549 }, { "epoch": 0.62, "learning_rate": 1.6732417165424647e-06, "loss": 1.1097, "step": 20550 }, { "epoch": 0.62, "learning_rate": 1.673011524647044e-06, "loss": 1.0689, "step": 20551 }, { "epoch": 0.62, "learning_rate": 1.6727813406241553e-06, "loss": 1.0952, "step": 20552 }, { "epoch": 0.62, "learning_rate": 1.6725511644759897e-06, "loss": 1.0759, "step": 20553 }, { "epoch": 0.62, "learning_rate": 1.6723209962047393e-06, "loss": 1.0579, "step": 20554 }, { "epoch": 0.62, "learning_rate": 1.6720908358125936e-06, "loss": 1.1349, "step": 20555 }, { "epoch": 0.62, "learning_rate": 1.6718606833017447e-06, "loss": 1.0997, "step": 20556 }, { "epoch": 0.62, "learning_rate": 1.6716305386743831e-06, "loss": 1.1769, "step": 20557 }, { "epoch": 0.62, "learning_rate": 1.6714004019326998e-06, "loss": 1.2271, "step": 20558 }, { "epoch": 0.62, "learning_rate": 1.6711702730788868e-06, "loss": 1.1113, "step": 20559 }, { "epoch": 0.62, "learning_rate": 1.6709401521151325e-06, "loss": 1.0232, "step": 20560 }, { "epoch": 0.62, "learning_rate": 1.6707100390436284e-06, "loss": 1.0388, "step": 20561 }, { "epoch": 0.62, "learning_rate": 1.6704799338665656e-06, "loss": 1.2393, "step": 20562 }, { "epoch": 0.62, "learning_rate": 1.6702498365861352e-06, "loss": 1.0532, "step": 20563 }, { "epoch": 0.62, "learning_rate": 1.670019747204526e-06, "loss": 1.0727, "step": 20564 }, { "epoch": 0.62, "learning_rate": 1.6697896657239288e-06, "loss": 1.1329, "step": 20565 }, { "epoch": 0.62, "learning_rate": 1.669559592146534e-06, "loss": 1.0591, "step": 20566 }, { "epoch": 0.62, "learning_rate": 1.6693295264745329e-06, "loss": 1.1382, "step": 20567 }, { "epoch": 0.62, "learning_rate": 1.6690994687101137e-06, "loss": 1.1035, "step": 20568 }, { "epoch": 0.62, "learning_rate": 1.6688694188554677e-06, "loss": 1.0614, "step": 20569 }, { "epoch": 0.62, "learning_rate": 1.6686393769127842e-06, "loss": 1.0829, "step": 20570 }, { "epoch": 0.62, "learning_rate": 1.6684093428842537e-06, "loss": 1.1363, "step": 20571 }, { "epoch": 0.62, "learning_rate": 1.6681793167720666e-06, "loss": 1.1783, "step": 20572 }, { "epoch": 0.62, "learning_rate": 1.667949298578411e-06, "loss": 1.1328, "step": 20573 }, { "epoch": 0.62, "learning_rate": 1.6677192883054772e-06, "loss": 1.174, "step": 20574 }, { "epoch": 0.62, "learning_rate": 1.667489285955455e-06, "loss": 1.1145, "step": 20575 }, { "epoch": 0.62, "learning_rate": 1.6672592915305346e-06, "loss": 1.1407, "step": 20576 }, { "epoch": 0.62, "learning_rate": 1.667029305032904e-06, "loss": 1.0022, "step": 20577 }, { "epoch": 0.62, "learning_rate": 1.666799326464753e-06, "loss": 1.0821, "step": 20578 }, { "epoch": 0.62, "learning_rate": 1.6665693558282713e-06, "loss": 1.0085, "step": 20579 }, { "epoch": 0.62, "learning_rate": 1.6663393931256485e-06, "loss": 1.1294, "step": 20580 }, { "epoch": 0.62, "learning_rate": 1.6661094383590725e-06, "loss": 1.3506, "step": 20581 }, { "epoch": 0.62, "learning_rate": 1.6658794915307333e-06, "loss": 1.0543, "step": 20582 }, { "epoch": 0.62, "learning_rate": 1.6656495526428196e-06, "loss": 1.1542, "step": 20583 }, { "epoch": 0.62, "learning_rate": 1.6654196216975199e-06, "loss": 1.1168, "step": 20584 }, { "epoch": 0.62, "learning_rate": 1.6651896986970247e-06, "loss": 1.0868, "step": 20585 }, { "epoch": 0.62, "learning_rate": 1.6649597836435204e-06, "loss": 1.1641, "step": 20586 }, { "epoch": 0.62, "learning_rate": 1.664729876539197e-06, "loss": 1.1887, "step": 20587 }, { "epoch": 0.62, "learning_rate": 1.6644999773862427e-06, "loss": 1.1566, "step": 20588 }, { "epoch": 0.62, "learning_rate": 1.6642700861868474e-06, "loss": 1.1129, "step": 20589 }, { "epoch": 0.62, "learning_rate": 1.6640402029431972e-06, "loss": 1.1251, "step": 20590 }, { "epoch": 0.62, "learning_rate": 1.663810327657482e-06, "loss": 1.2083, "step": 20591 }, { "epoch": 0.62, "learning_rate": 1.6635804603318894e-06, "loss": 1.1613, "step": 20592 }, { "epoch": 0.62, "learning_rate": 1.6633506009686084e-06, "loss": 1.2306, "step": 20593 }, { "epoch": 0.62, "learning_rate": 1.6631207495698266e-06, "loss": 1.2046, "step": 20594 }, { "epoch": 0.62, "learning_rate": 1.6628909061377318e-06, "loss": 1.0706, "step": 20595 }, { "epoch": 0.62, "learning_rate": 1.6626610706745127e-06, "loss": 1.153, "step": 20596 }, { "epoch": 0.62, "learning_rate": 1.662431243182358e-06, "loss": 1.1036, "step": 20597 }, { "epoch": 0.62, "learning_rate": 1.6622014236634535e-06, "loss": 1.1254, "step": 20598 }, { "epoch": 0.62, "learning_rate": 1.6619716121199878e-06, "loss": 1.0309, "step": 20599 }, { "epoch": 0.62, "learning_rate": 1.6617418085541486e-06, "loss": 1.2561, "step": 20600 }, { "epoch": 0.62, "learning_rate": 1.661512012968124e-06, "loss": 1.1832, "step": 20601 }, { "epoch": 0.62, "learning_rate": 1.661282225364102e-06, "loss": 1.1546, "step": 20602 }, { "epoch": 0.62, "learning_rate": 1.6610524457442684e-06, "loss": 1.1491, "step": 20603 }, { "epoch": 0.62, "learning_rate": 1.6608226741108113e-06, "loss": 1.1546, "step": 20604 }, { "epoch": 0.62, "learning_rate": 1.660592910465918e-06, "loss": 1.1765, "step": 20605 }, { "epoch": 0.62, "learning_rate": 1.6603631548117767e-06, "loss": 1.321, "step": 20606 }, { "epoch": 0.62, "learning_rate": 1.6601334071505732e-06, "loss": 1.0618, "step": 20607 }, { "epoch": 0.62, "learning_rate": 1.6599036674844955e-06, "loss": 1.0745, "step": 20608 }, { "epoch": 0.62, "learning_rate": 1.65967393581573e-06, "loss": 1.0245, "step": 20609 }, { "epoch": 0.62, "learning_rate": 1.659444212146465e-06, "loss": 1.1068, "step": 20610 }, { "epoch": 0.62, "learning_rate": 1.6592144964788847e-06, "loss": 1.2224, "step": 20611 }, { "epoch": 0.62, "learning_rate": 1.6589847888151784e-06, "loss": 1.0288, "step": 20612 }, { "epoch": 0.62, "learning_rate": 1.6587550891575311e-06, "loss": 1.0158, "step": 20613 }, { "epoch": 0.62, "learning_rate": 1.6585253975081306e-06, "loss": 1.1963, "step": 20614 }, { "epoch": 0.62, "learning_rate": 1.6582957138691639e-06, "loss": 1.0624, "step": 20615 }, { "epoch": 0.62, "learning_rate": 1.6580660382428157e-06, "loss": 1.1561, "step": 20616 }, { "epoch": 0.62, "learning_rate": 1.6578363706312734e-06, "loss": 1.0811, "step": 20617 }, { "epoch": 0.62, "learning_rate": 1.657606711036723e-06, "loss": 1.2802, "step": 20618 }, { "epoch": 0.62, "learning_rate": 1.6573770594613516e-06, "loss": 1.0156, "step": 20619 }, { "epoch": 0.62, "learning_rate": 1.6571474159073442e-06, "loss": 1.1706, "step": 20620 }, { "epoch": 0.62, "learning_rate": 1.6569177803768876e-06, "loss": 1.1688, "step": 20621 }, { "epoch": 0.62, "learning_rate": 1.6566881528721684e-06, "loss": 1.1142, "step": 20622 }, { "epoch": 0.62, "learning_rate": 1.6564585333953714e-06, "loss": 1.0935, "step": 20623 }, { "epoch": 0.62, "learning_rate": 1.6562289219486827e-06, "loss": 1.1658, "step": 20624 }, { "epoch": 0.62, "learning_rate": 1.6559993185342882e-06, "loss": 1.267, "step": 20625 }, { "epoch": 0.62, "learning_rate": 1.6557697231543737e-06, "loss": 1.1319, "step": 20626 }, { "epoch": 0.62, "learning_rate": 1.655540135811125e-06, "loss": 1.0227, "step": 20627 }, { "epoch": 0.62, "learning_rate": 1.6553105565067284e-06, "loss": 1.058, "step": 20628 }, { "epoch": 0.62, "learning_rate": 1.6550809852433674e-06, "loss": 1.1074, "step": 20629 }, { "epoch": 0.62, "learning_rate": 1.6548514220232284e-06, "loss": 1.2101, "step": 20630 }, { "epoch": 0.62, "learning_rate": 1.654621866848497e-06, "loss": 1.2293, "step": 20631 }, { "epoch": 0.62, "learning_rate": 1.6543923197213584e-06, "loss": 1.1075, "step": 20632 }, { "epoch": 0.62, "learning_rate": 1.6541627806439984e-06, "loss": 1.1876, "step": 20633 }, { "epoch": 0.62, "learning_rate": 1.6539332496186002e-06, "loss": 1.2081, "step": 20634 }, { "epoch": 0.62, "learning_rate": 1.6537037266473505e-06, "loss": 1.1216, "step": 20635 }, { "epoch": 0.62, "learning_rate": 1.6534742117324337e-06, "loss": 1.2676, "step": 20636 }, { "epoch": 0.62, "learning_rate": 1.6532447048760348e-06, "loss": 1.0696, "step": 20637 }, { "epoch": 0.62, "learning_rate": 1.6530152060803379e-06, "loss": 1.1919, "step": 20638 }, { "epoch": 0.62, "learning_rate": 1.6527857153475286e-06, "loss": 1.1508, "step": 20639 }, { "epoch": 0.62, "learning_rate": 1.652556232679791e-06, "loss": 1.2732, "step": 20640 }, { "epoch": 0.62, "learning_rate": 1.6523267580793112e-06, "loss": 1.0785, "step": 20641 }, { "epoch": 0.62, "learning_rate": 1.6520972915482713e-06, "loss": 1.135, "step": 20642 }, { "epoch": 0.62, "learning_rate": 1.651867833088857e-06, "loss": 1.1226, "step": 20643 }, { "epoch": 0.62, "learning_rate": 1.6516383827032524e-06, "loss": 1.0162, "step": 20644 }, { "epoch": 0.62, "learning_rate": 1.651408940393643e-06, "loss": 1.031, "step": 20645 }, { "epoch": 0.62, "learning_rate": 1.6511795061622104e-06, "loss": 1.0283, "step": 20646 }, { "epoch": 0.62, "learning_rate": 1.6509500800111403e-06, "loss": 1.1321, "step": 20647 }, { "epoch": 0.62, "learning_rate": 1.6507206619426164e-06, "loss": 1.0995, "step": 20648 }, { "epoch": 0.62, "learning_rate": 1.6504912519588233e-06, "loss": 1.1398, "step": 20649 }, { "epoch": 0.62, "learning_rate": 1.650261850061944e-06, "loss": 1.0372, "step": 20650 }, { "epoch": 0.62, "learning_rate": 1.6500324562541625e-06, "loss": 1.1115, "step": 20651 }, { "epoch": 0.62, "learning_rate": 1.6498030705376628e-06, "loss": 1.1276, "step": 20652 }, { "epoch": 0.62, "learning_rate": 1.649573692914628e-06, "loss": 1.0811, "step": 20653 }, { "epoch": 0.62, "learning_rate": 1.6493443233872435e-06, "loss": 1.2594, "step": 20654 }, { "epoch": 0.62, "learning_rate": 1.6491149619576901e-06, "loss": 1.1448, "step": 20655 }, { "epoch": 0.62, "learning_rate": 1.6488856086281523e-06, "loss": 1.1625, "step": 20656 }, { "epoch": 0.62, "learning_rate": 1.6486562634008141e-06, "loss": 1.0806, "step": 20657 }, { "epoch": 0.62, "learning_rate": 1.648426926277859e-06, "loss": 1.085, "step": 20658 }, { "epoch": 0.62, "learning_rate": 1.6481975972614683e-06, "loss": 1.1081, "step": 20659 }, { "epoch": 0.62, "learning_rate": 1.6479682763538263e-06, "loss": 1.1102, "step": 20660 }, { "epoch": 0.62, "learning_rate": 1.6477389635571161e-06, "loss": 1.2875, "step": 20661 }, { "epoch": 0.62, "learning_rate": 1.6475096588735211e-06, "loss": 1.0178, "step": 20662 }, { "epoch": 0.62, "learning_rate": 1.6472803623052228e-06, "loss": 1.135, "step": 20663 }, { "epoch": 0.62, "learning_rate": 1.6470510738544048e-06, "loss": 1.0337, "step": 20664 }, { "epoch": 0.62, "learning_rate": 1.64682179352325e-06, "loss": 1.1421, "step": 20665 }, { "epoch": 0.62, "learning_rate": 1.6465925213139406e-06, "loss": 1.1156, "step": 20666 }, { "epoch": 0.62, "learning_rate": 1.6463632572286604e-06, "loss": 1.029, "step": 20667 }, { "epoch": 0.62, "learning_rate": 1.6461340012695898e-06, "loss": 1.1249, "step": 20668 }, { "epoch": 0.62, "learning_rate": 1.6459047534389125e-06, "loss": 1.0874, "step": 20669 }, { "epoch": 0.62, "learning_rate": 1.6456755137388105e-06, "loss": 1.2084, "step": 20670 }, { "epoch": 0.62, "learning_rate": 1.6454462821714673e-06, "loss": 1.0551, "step": 20671 }, { "epoch": 0.62, "learning_rate": 1.6452170587390625e-06, "loss": 1.009, "step": 20672 }, { "epoch": 0.62, "learning_rate": 1.64498784344378e-06, "loss": 1.1467, "step": 20673 }, { "epoch": 0.62, "learning_rate": 1.6447586362878015e-06, "loss": 1.2963, "step": 20674 }, { "epoch": 0.62, "learning_rate": 1.644529437273309e-06, "loss": 1.0593, "step": 20675 }, { "epoch": 0.62, "learning_rate": 1.6443002464024841e-06, "loss": 1.0727, "step": 20676 }, { "epoch": 0.62, "learning_rate": 1.6440710636775086e-06, "loss": 1.0885, "step": 20677 }, { "epoch": 0.62, "learning_rate": 1.6438418891005643e-06, "loss": 1.0236, "step": 20678 }, { "epoch": 0.62, "learning_rate": 1.643612722673833e-06, "loss": 1.1366, "step": 20679 }, { "epoch": 0.62, "learning_rate": 1.6433835643994968e-06, "loss": 1.0717, "step": 20680 }, { "epoch": 0.62, "learning_rate": 1.643154414279736e-06, "loss": 1.1678, "step": 20681 }, { "epoch": 0.62, "learning_rate": 1.6429252723167323e-06, "loss": 1.0205, "step": 20682 }, { "epoch": 0.62, "learning_rate": 1.6426961385126673e-06, "loss": 1.2291, "step": 20683 }, { "epoch": 0.62, "learning_rate": 1.642467012869723e-06, "loss": 1.0876, "step": 20684 }, { "epoch": 0.62, "learning_rate": 1.6422378953900786e-06, "loss": 1.0847, "step": 20685 }, { "epoch": 0.62, "learning_rate": 1.6420087860759166e-06, "loss": 1.0652, "step": 20686 }, { "epoch": 0.62, "learning_rate": 1.6417796849294176e-06, "loss": 1.2084, "step": 20687 }, { "epoch": 0.62, "learning_rate": 1.641550591952763e-06, "loss": 1.0186, "step": 20688 }, { "epoch": 0.62, "learning_rate": 1.6413215071481332e-06, "loss": 1.1705, "step": 20689 }, { "epoch": 0.62, "learning_rate": 1.641092430517709e-06, "loss": 1.1496, "step": 20690 }, { "epoch": 0.62, "learning_rate": 1.640863362063671e-06, "loss": 1.119, "step": 20691 }, { "epoch": 0.62, "learning_rate": 1.6406343017882004e-06, "loss": 1.0247, "step": 20692 }, { "epoch": 0.62, "learning_rate": 1.640405249693478e-06, "loss": 1.2053, "step": 20693 }, { "epoch": 0.62, "learning_rate": 1.6401762057816828e-06, "loss": 1.021, "step": 20694 }, { "epoch": 0.62, "learning_rate": 1.6399471700549957e-06, "loss": 1.0746, "step": 20695 }, { "epoch": 0.62, "learning_rate": 1.6397181425155977e-06, "loss": 1.1463, "step": 20696 }, { "epoch": 0.62, "learning_rate": 1.6394891231656694e-06, "loss": 1.0364, "step": 20697 }, { "epoch": 0.62, "learning_rate": 1.6392601120073896e-06, "loss": 1.1656, "step": 20698 }, { "epoch": 0.62, "learning_rate": 1.6390311090429386e-06, "loss": 1.2449, "step": 20699 }, { "epoch": 0.62, "learning_rate": 1.638802114274497e-06, "loss": 1.0572, "step": 20700 }, { "epoch": 0.62, "learning_rate": 1.638573127704245e-06, "loss": 1.1092, "step": 20701 }, { "epoch": 0.62, "learning_rate": 1.6383441493343614e-06, "loss": 1.1133, "step": 20702 }, { "epoch": 0.62, "learning_rate": 1.6381151791670264e-06, "loss": 1.1445, "step": 20703 }, { "epoch": 0.62, "learning_rate": 1.6378862172044203e-06, "loss": 1.1227, "step": 20704 }, { "epoch": 0.62, "learning_rate": 1.637657263448722e-06, "loss": 1.095, "step": 20705 }, { "epoch": 0.62, "learning_rate": 1.6374283179021114e-06, "loss": 1.1878, "step": 20706 }, { "epoch": 0.62, "learning_rate": 1.6371993805667674e-06, "loss": 1.1207, "step": 20707 }, { "epoch": 0.62, "learning_rate": 1.6369704514448698e-06, "loss": 0.9993, "step": 20708 }, { "epoch": 0.62, "learning_rate": 1.6367415305385976e-06, "loss": 1.199, "step": 20709 }, { "epoch": 0.62, "learning_rate": 1.6365126178501317e-06, "loss": 1.1639, "step": 20710 }, { "epoch": 0.62, "learning_rate": 1.6362837133816483e-06, "loss": 1.133, "step": 20711 }, { "epoch": 0.62, "learning_rate": 1.6360548171353285e-06, "loss": 1.0903, "step": 20712 }, { "epoch": 0.62, "learning_rate": 1.6358259291133504e-06, "loss": 1.0027, "step": 20713 }, { "epoch": 0.62, "learning_rate": 1.635597049317894e-06, "loss": 1.0969, "step": 20714 }, { "epoch": 0.62, "learning_rate": 1.635368177751137e-06, "loss": 0.9799, "step": 20715 }, { "epoch": 0.62, "learning_rate": 1.6351393144152582e-06, "loss": 1.109, "step": 20716 }, { "epoch": 0.62, "learning_rate": 1.6349104593124371e-06, "loss": 1.1699, "step": 20717 }, { "epoch": 0.62, "learning_rate": 1.6346816124448511e-06, "loss": 1.0736, "step": 20718 }, { "epoch": 0.62, "learning_rate": 1.6344527738146804e-06, "loss": 1.1418, "step": 20719 }, { "epoch": 0.62, "learning_rate": 1.6342239434241014e-06, "loss": 1.1236, "step": 20720 }, { "epoch": 0.62, "learning_rate": 1.6339951212752939e-06, "loss": 1.1028, "step": 20721 }, { "epoch": 0.62, "learning_rate": 1.6337663073704357e-06, "loss": 1.0975, "step": 20722 }, { "epoch": 0.62, "learning_rate": 1.6335375017117062e-06, "loss": 1.0668, "step": 20723 }, { "epoch": 0.62, "learning_rate": 1.6333087043012808e-06, "loss": 1.0222, "step": 20724 }, { "epoch": 0.62, "learning_rate": 1.6330799151413395e-06, "loss": 1.3018, "step": 20725 }, { "epoch": 0.62, "learning_rate": 1.63285113423406e-06, "loss": 1.0915, "step": 20726 }, { "epoch": 0.62, "learning_rate": 1.632622361581621e-06, "loss": 1.027, "step": 20727 }, { "epoch": 0.62, "learning_rate": 1.6323935971861982e-06, "loss": 1.0916, "step": 20728 }, { "epoch": 0.62, "learning_rate": 1.6321648410499708e-06, "loss": 1.1973, "step": 20729 }, { "epoch": 0.62, "learning_rate": 1.631936093175116e-06, "loss": 1.2028, "step": 20730 }, { "epoch": 0.62, "learning_rate": 1.6317073535638113e-06, "loss": 1.0401, "step": 20731 }, { "epoch": 0.62, "learning_rate": 1.631478622218235e-06, "loss": 1.0579, "step": 20732 }, { "epoch": 0.62, "learning_rate": 1.6312498991405636e-06, "loss": 1.1409, "step": 20733 }, { "epoch": 0.62, "learning_rate": 1.631021184332975e-06, "loss": 1.0306, "step": 20734 }, { "epoch": 0.62, "learning_rate": 1.6307924777976455e-06, "loss": 1.1142, "step": 20735 }, { "epoch": 0.62, "learning_rate": 1.6305637795367545e-06, "loss": 1.0988, "step": 20736 }, { "epoch": 0.62, "learning_rate": 1.6303350895524766e-06, "loss": 1.1965, "step": 20737 }, { "epoch": 0.62, "learning_rate": 1.6301064078469897e-06, "loss": 1.0605, "step": 20738 }, { "epoch": 0.62, "learning_rate": 1.6298777344224706e-06, "loss": 1.1545, "step": 20739 }, { "epoch": 0.62, "learning_rate": 1.6296490692810979e-06, "loss": 1.0445, "step": 20740 }, { "epoch": 0.62, "learning_rate": 1.6294204124250453e-06, "loss": 1.1274, "step": 20741 }, { "epoch": 0.62, "learning_rate": 1.6291917638564914e-06, "loss": 1.1202, "step": 20742 }, { "epoch": 0.62, "learning_rate": 1.6289631235776127e-06, "loss": 1.1221, "step": 20743 }, { "epoch": 0.62, "learning_rate": 1.628734491590585e-06, "loss": 1.2371, "step": 20744 }, { "epoch": 0.62, "learning_rate": 1.6285058678975862e-06, "loss": 1.0919, "step": 20745 }, { "epoch": 0.62, "learning_rate": 1.6282772525007915e-06, "loss": 1.2288, "step": 20746 }, { "epoch": 0.63, "learning_rate": 1.6280486454023772e-06, "loss": 1.1461, "step": 20747 }, { "epoch": 0.63, "learning_rate": 1.6278200466045202e-06, "loss": 1.1207, "step": 20748 }, { "epoch": 0.63, "learning_rate": 1.6275914561093969e-06, "loss": 1.0553, "step": 20749 }, { "epoch": 0.63, "learning_rate": 1.6273628739191821e-06, "loss": 0.9282, "step": 20750 }, { "epoch": 0.63, "learning_rate": 1.6271343000360522e-06, "loss": 1.1493, "step": 20751 }, { "epoch": 0.63, "learning_rate": 1.6269057344621836e-06, "loss": 1.1035, "step": 20752 }, { "epoch": 0.63, "learning_rate": 1.6266771771997525e-06, "loss": 1.1111, "step": 20753 }, { "epoch": 0.63, "learning_rate": 1.6264486282509335e-06, "loss": 1.0629, "step": 20754 }, { "epoch": 0.63, "learning_rate": 1.6262200876179026e-06, "loss": 1.1324, "step": 20755 }, { "epoch": 0.63, "learning_rate": 1.6259915553028358e-06, "loss": 1.2769, "step": 20756 }, { "epoch": 0.63, "learning_rate": 1.6257630313079083e-06, "loss": 1.1312, "step": 20757 }, { "epoch": 0.63, "learning_rate": 1.6255345156352964e-06, "loss": 1.1519, "step": 20758 }, { "epoch": 0.63, "learning_rate": 1.6253060082871741e-06, "loss": 0.9642, "step": 20759 }, { "epoch": 0.63, "learning_rate": 1.6250775092657174e-06, "loss": 1.0139, "step": 20760 }, { "epoch": 0.63, "learning_rate": 1.6248490185731015e-06, "loss": 1.1042, "step": 20761 }, { "epoch": 0.63, "learning_rate": 1.6246205362115023e-06, "loss": 1.1234, "step": 20762 }, { "epoch": 0.63, "learning_rate": 1.624392062183093e-06, "loss": 1.0893, "step": 20763 }, { "epoch": 0.63, "learning_rate": 1.6241635964900496e-06, "loss": 1.1453, "step": 20764 }, { "epoch": 0.63, "learning_rate": 1.623935139134547e-06, "loss": 1.0034, "step": 20765 }, { "epoch": 0.63, "learning_rate": 1.623706690118761e-06, "loss": 1.0804, "step": 20766 }, { "epoch": 0.63, "learning_rate": 1.6234782494448642e-06, "loss": 1.1604, "step": 20767 }, { "epoch": 0.63, "learning_rate": 1.6232498171150323e-06, "loss": 1.1227, "step": 20768 }, { "epoch": 0.63, "learning_rate": 1.6230213931314398e-06, "loss": 1.0143, "step": 20769 }, { "epoch": 0.63, "learning_rate": 1.6227929774962613e-06, "loss": 0.9989, "step": 20770 }, { "epoch": 0.63, "learning_rate": 1.6225645702116716e-06, "loss": 1.1246, "step": 20771 }, { "epoch": 0.63, "learning_rate": 1.6223361712798444e-06, "loss": 1.1011, "step": 20772 }, { "epoch": 0.63, "learning_rate": 1.6221077807029539e-06, "loss": 1.185, "step": 20773 }, { "epoch": 0.63, "learning_rate": 1.6218793984831748e-06, "loss": 1.1401, "step": 20774 }, { "epoch": 0.63, "learning_rate": 1.6216510246226815e-06, "loss": 1.155, "step": 20775 }, { "epoch": 0.63, "learning_rate": 1.6214226591236467e-06, "loss": 1.0698, "step": 20776 }, { "epoch": 0.63, "learning_rate": 1.621194301988245e-06, "loss": 1.0639, "step": 20777 }, { "epoch": 0.63, "learning_rate": 1.6209659532186502e-06, "loss": 1.1216, "step": 20778 }, { "epoch": 0.63, "learning_rate": 1.6207376128170375e-06, "loss": 1.1492, "step": 20779 }, { "epoch": 0.63, "learning_rate": 1.620509280785578e-06, "loss": 1.1499, "step": 20780 }, { "epoch": 0.63, "learning_rate": 1.6202809571264466e-06, "loss": 1.2648, "step": 20781 }, { "epoch": 0.63, "learning_rate": 1.6200526418418167e-06, "loss": 1.0879, "step": 20782 }, { "epoch": 0.63, "learning_rate": 1.6198243349338624e-06, "loss": 1.0479, "step": 20783 }, { "epoch": 0.63, "learning_rate": 1.6195960364047561e-06, "loss": 1.0274, "step": 20784 }, { "epoch": 0.63, "learning_rate": 1.6193677462566715e-06, "loss": 1.1365, "step": 20785 }, { "epoch": 0.63, "learning_rate": 1.6191394644917823e-06, "loss": 1.0763, "step": 20786 }, { "epoch": 0.63, "learning_rate": 1.6189111911122608e-06, "loss": 1.1938, "step": 20787 }, { "epoch": 0.63, "learning_rate": 1.6186829261202808e-06, "loss": 1.0224, "step": 20788 }, { "epoch": 0.63, "learning_rate": 1.6184546695180143e-06, "loss": 1.1277, "step": 20789 }, { "epoch": 0.63, "learning_rate": 1.6182264213076348e-06, "loss": 1.1766, "step": 20790 }, { "epoch": 0.63, "learning_rate": 1.6179981814913148e-06, "loss": 1.0624, "step": 20791 }, { "epoch": 0.63, "learning_rate": 1.6177699500712292e-06, "loss": 1.1085, "step": 20792 }, { "epoch": 0.63, "learning_rate": 1.617541727049547e-06, "loss": 0.9952, "step": 20793 }, { "epoch": 0.63, "learning_rate": 1.6173135124284429e-06, "loss": 1.2997, "step": 20794 }, { "epoch": 0.63, "learning_rate": 1.617085306210089e-06, "loss": 1.1051, "step": 20795 }, { "epoch": 0.63, "learning_rate": 1.6168571083966577e-06, "loss": 1.0735, "step": 20796 }, { "epoch": 0.63, "learning_rate": 1.6166289189903223e-06, "loss": 1.1087, "step": 20797 }, { "epoch": 0.63, "learning_rate": 1.616400737993253e-06, "loss": 1.1505, "step": 20798 }, { "epoch": 0.63, "learning_rate": 1.6161725654076236e-06, "loss": 1.2211, "step": 20799 }, { "epoch": 0.63, "learning_rate": 1.615944401235605e-06, "loss": 1.186, "step": 20800 }, { "epoch": 0.63, "learning_rate": 1.6157162454793713e-06, "loss": 1.1853, "step": 20801 }, { "epoch": 0.63, "learning_rate": 1.615488098141092e-06, "loss": 1.1893, "step": 20802 }, { "epoch": 0.63, "learning_rate": 1.61525995922294e-06, "loss": 1.0496, "step": 20803 }, { "epoch": 0.63, "learning_rate": 1.6150318287270874e-06, "loss": 1.1453, "step": 20804 }, { "epoch": 0.63, "learning_rate": 1.6148037066557065e-06, "loss": 1.2557, "step": 20805 }, { "epoch": 0.63, "learning_rate": 1.6145755930109668e-06, "loss": 1.1957, "step": 20806 }, { "epoch": 0.63, "learning_rate": 1.614347487795041e-06, "loss": 1.0755, "step": 20807 }, { "epoch": 0.63, "learning_rate": 1.6141193910101007e-06, "loss": 1.0626, "step": 20808 }, { "epoch": 0.63, "learning_rate": 1.6138913026583184e-06, "loss": 1.0321, "step": 20809 }, { "epoch": 0.63, "learning_rate": 1.6136632227418627e-06, "loss": 1.0884, "step": 20810 }, { "epoch": 0.63, "learning_rate": 1.6134351512629065e-06, "loss": 1.1382, "step": 20811 }, { "epoch": 0.63, "learning_rate": 1.6132070882236207e-06, "loss": 1.2062, "step": 20812 }, { "epoch": 0.63, "learning_rate": 1.612979033626176e-06, "loss": 1.1064, "step": 20813 }, { "epoch": 0.63, "learning_rate": 1.6127509874727446e-06, "loss": 1.0576, "step": 20814 }, { "epoch": 0.63, "learning_rate": 1.6125229497654956e-06, "loss": 0.9991, "step": 20815 }, { "epoch": 0.63, "learning_rate": 1.612294920506601e-06, "loss": 1.2234, "step": 20816 }, { "epoch": 0.63, "learning_rate": 1.6120668996982312e-06, "loss": 1.2117, "step": 20817 }, { "epoch": 0.63, "learning_rate": 1.6118388873425578e-06, "loss": 1.1923, "step": 20818 }, { "epoch": 0.63, "learning_rate": 1.6116108834417492e-06, "loss": 1.1642, "step": 20819 }, { "epoch": 0.63, "learning_rate": 1.6113828879979776e-06, "loss": 1.1511, "step": 20820 }, { "epoch": 0.63, "learning_rate": 1.6111549010134125e-06, "loss": 1.1719, "step": 20821 }, { "epoch": 0.63, "learning_rate": 1.6109269224902258e-06, "loss": 0.9404, "step": 20822 }, { "epoch": 0.63, "learning_rate": 1.6106989524305857e-06, "loss": 1.0604, "step": 20823 }, { "epoch": 0.63, "learning_rate": 1.6104709908366634e-06, "loss": 1.1924, "step": 20824 }, { "epoch": 0.63, "learning_rate": 1.6102430377106287e-06, "loss": 1.2078, "step": 20825 }, { "epoch": 0.63, "learning_rate": 1.6100150930546515e-06, "loss": 1.1255, "step": 20826 }, { "epoch": 0.63, "learning_rate": 1.6097871568709028e-06, "loss": 1.1358, "step": 20827 }, { "epoch": 0.63, "learning_rate": 1.609559229161551e-06, "loss": 1.2499, "step": 20828 }, { "epoch": 0.63, "learning_rate": 1.6093313099287667e-06, "loss": 1.0754, "step": 20829 }, { "epoch": 0.63, "learning_rate": 1.609103399174719e-06, "loss": 1.172, "step": 20830 }, { "epoch": 0.63, "learning_rate": 1.6088754969015791e-06, "loss": 1.1371, "step": 20831 }, { "epoch": 0.63, "learning_rate": 1.6086476031115146e-06, "loss": 1.0791, "step": 20832 }, { "epoch": 0.63, "learning_rate": 1.608419717806695e-06, "loss": 1.1041, "step": 20833 }, { "epoch": 0.63, "learning_rate": 1.6081918409892904e-06, "loss": 1.1971, "step": 20834 }, { "epoch": 0.63, "learning_rate": 1.6079639726614716e-06, "loss": 1.0802, "step": 20835 }, { "epoch": 0.63, "learning_rate": 1.6077361128254044e-06, "loss": 1.1248, "step": 20836 }, { "epoch": 0.63, "learning_rate": 1.60750826148326e-06, "loss": 1.1147, "step": 20837 }, { "epoch": 0.63, "learning_rate": 1.6072804186372072e-06, "loss": 1.1087, "step": 20838 }, { "epoch": 0.63, "learning_rate": 1.6070525842894146e-06, "loss": 1.1169, "step": 20839 }, { "epoch": 0.63, "learning_rate": 1.6068247584420521e-06, "loss": 1.0674, "step": 20840 }, { "epoch": 0.63, "learning_rate": 1.606596941097287e-06, "loss": 1.1893, "step": 20841 }, { "epoch": 0.63, "learning_rate": 1.6063691322572888e-06, "loss": 1.0522, "step": 20842 }, { "epoch": 0.63, "learning_rate": 1.6061413319242263e-06, "loss": 1.1133, "step": 20843 }, { "epoch": 0.63, "learning_rate": 1.6059135401002685e-06, "loss": 1.2883, "step": 20844 }, { "epoch": 0.63, "learning_rate": 1.6056857567875824e-06, "loss": 1.1417, "step": 20845 }, { "epoch": 0.63, "learning_rate": 1.6054579819883374e-06, "loss": 1.1047, "step": 20846 }, { "epoch": 0.63, "learning_rate": 1.6052302157047013e-06, "loss": 1.2097, "step": 20847 }, { "epoch": 0.63, "learning_rate": 1.6050024579388435e-06, "loss": 1.0649, "step": 20848 }, { "epoch": 0.63, "learning_rate": 1.6047747086929306e-06, "loss": 1.1509, "step": 20849 }, { "epoch": 0.63, "learning_rate": 1.604546967969131e-06, "loss": 1.0778, "step": 20850 }, { "epoch": 0.63, "learning_rate": 1.6043192357696131e-06, "loss": 1.0065, "step": 20851 }, { "epoch": 0.63, "learning_rate": 1.6040915120965445e-06, "loss": 1.0954, "step": 20852 }, { "epoch": 0.63, "learning_rate": 1.603863796952094e-06, "loss": 1.0944, "step": 20853 }, { "epoch": 0.63, "learning_rate": 1.603636090338428e-06, "loss": 1.2009, "step": 20854 }, { "epoch": 0.63, "learning_rate": 1.6034083922577148e-06, "loss": 1.1616, "step": 20855 }, { "epoch": 0.63, "learning_rate": 1.6031807027121216e-06, "loss": 1.0681, "step": 20856 }, { "epoch": 0.63, "learning_rate": 1.6029530217038176e-06, "loss": 1.0759, "step": 20857 }, { "epoch": 0.63, "learning_rate": 1.6027253492349676e-06, "loss": 1.1026, "step": 20858 }, { "epoch": 0.63, "learning_rate": 1.60249768530774e-06, "loss": 1.1077, "step": 20859 }, { "epoch": 0.63, "learning_rate": 1.6022700299243022e-06, "loss": 1.1705, "step": 20860 }, { "epoch": 0.63, "learning_rate": 1.6020423830868226e-06, "loss": 1.1505, "step": 20861 }, { "epoch": 0.63, "learning_rate": 1.6018147447974658e-06, "loss": 1.095, "step": 20862 }, { "epoch": 0.63, "learning_rate": 1.6015871150584e-06, "loss": 1.0161, "step": 20863 }, { "epoch": 0.63, "learning_rate": 1.6013594938717925e-06, "loss": 0.9828, "step": 20864 }, { "epoch": 0.63, "learning_rate": 1.6011318812398096e-06, "loss": 1.0673, "step": 20865 }, { "epoch": 0.63, "learning_rate": 1.6009042771646189e-06, "loss": 1.0803, "step": 20866 }, { "epoch": 0.63, "learning_rate": 1.600676681648386e-06, "loss": 1.1875, "step": 20867 }, { "epoch": 0.63, "learning_rate": 1.6004490946932782e-06, "loss": 1.0597, "step": 20868 }, { "epoch": 0.63, "learning_rate": 1.6002215163014612e-06, "loss": 1.1159, "step": 20869 }, { "epoch": 0.63, "learning_rate": 1.5999939464751029e-06, "loss": 1.128, "step": 20870 }, { "epoch": 0.63, "learning_rate": 1.599766385216368e-06, "loss": 1.1103, "step": 20871 }, { "epoch": 0.63, "learning_rate": 1.5995388325274236e-06, "loss": 1.1393, "step": 20872 }, { "epoch": 0.63, "learning_rate": 1.5993112884104361e-06, "loss": 1.064, "step": 20873 }, { "epoch": 0.63, "learning_rate": 1.599083752867572e-06, "loss": 1.1253, "step": 20874 }, { "epoch": 0.63, "learning_rate": 1.598856225900996e-06, "loss": 1.202, "step": 20875 }, { "epoch": 0.63, "learning_rate": 1.5986287075128743e-06, "loss": 1.0526, "step": 20876 }, { "epoch": 0.63, "learning_rate": 1.5984011977053737e-06, "loss": 1.1811, "step": 20877 }, { "epoch": 0.63, "learning_rate": 1.598173696480659e-06, "loss": 1.0847, "step": 20878 }, { "epoch": 0.63, "learning_rate": 1.5979462038408977e-06, "loss": 1.1459, "step": 20879 }, { "epoch": 0.63, "learning_rate": 1.5977187197882529e-06, "loss": 1.1592, "step": 20880 }, { "epoch": 0.63, "learning_rate": 1.5974912443248913e-06, "loss": 1.1102, "step": 20881 }, { "epoch": 0.63, "learning_rate": 1.5972637774529788e-06, "loss": 1.174, "step": 20882 }, { "epoch": 0.63, "learning_rate": 1.5970363191746805e-06, "loss": 1.0474, "step": 20883 }, { "epoch": 0.63, "learning_rate": 1.596808869492161e-06, "loss": 1.1772, "step": 20884 }, { "epoch": 0.63, "learning_rate": 1.5965814284075862e-06, "loss": 1.1298, "step": 20885 }, { "epoch": 0.63, "learning_rate": 1.596353995923121e-06, "loss": 1.1747, "step": 20886 }, { "epoch": 0.63, "learning_rate": 1.596126572040932e-06, "loss": 1.116, "step": 20887 }, { "epoch": 0.63, "learning_rate": 1.5958991567631809e-06, "loss": 1.0175, "step": 20888 }, { "epoch": 0.63, "learning_rate": 1.5956717500920348e-06, "loss": 1.117, "step": 20889 }, { "epoch": 0.63, "learning_rate": 1.5954443520296584e-06, "loss": 1.0201, "step": 20890 }, { "epoch": 0.63, "learning_rate": 1.595216962578216e-06, "loss": 1.0742, "step": 20891 }, { "epoch": 0.63, "learning_rate": 1.594989581739873e-06, "loss": 1.1682, "step": 20892 }, { "epoch": 0.63, "learning_rate": 1.5947622095167926e-06, "loss": 1.1078, "step": 20893 }, { "epoch": 0.63, "learning_rate": 1.5945348459111398e-06, "loss": 1.1151, "step": 20894 }, { "epoch": 0.63, "learning_rate": 1.5943074909250794e-06, "loss": 1.1, "step": 20895 }, { "epoch": 0.63, "learning_rate": 1.594080144560776e-06, "loss": 1.1376, "step": 20896 }, { "epoch": 0.63, "learning_rate": 1.5938528068203927e-06, "loss": 1.12, "step": 20897 }, { "epoch": 0.63, "learning_rate": 1.5936254777060944e-06, "loss": 1.1473, "step": 20898 }, { "epoch": 0.63, "learning_rate": 1.5933981572200446e-06, "loss": 1.1165, "step": 20899 }, { "epoch": 0.63, "learning_rate": 1.593170845364409e-06, "loss": 1.2193, "step": 20900 }, { "epoch": 0.63, "learning_rate": 1.5929435421413495e-06, "loss": 1.182, "step": 20901 }, { "epoch": 0.63, "learning_rate": 1.5927162475530303e-06, "loss": 1.1072, "step": 20902 }, { "epoch": 0.63, "learning_rate": 1.5924889616016154e-06, "loss": 1.0954, "step": 20903 }, { "epoch": 0.63, "learning_rate": 1.5922616842892684e-06, "loss": 1.0984, "step": 20904 }, { "epoch": 0.63, "learning_rate": 1.5920344156181545e-06, "loss": 1.1656, "step": 20905 }, { "epoch": 0.63, "learning_rate": 1.5918071555904344e-06, "loss": 1.295, "step": 20906 }, { "epoch": 0.63, "learning_rate": 1.5915799042082728e-06, "loss": 1.1141, "step": 20907 }, { "epoch": 0.63, "learning_rate": 1.5913526614738328e-06, "loss": 1.1277, "step": 20908 }, { "epoch": 0.63, "learning_rate": 1.5911254273892785e-06, "loss": 1.0248, "step": 20909 }, { "epoch": 0.63, "learning_rate": 1.590898201956772e-06, "loss": 1.0494, "step": 20910 }, { "epoch": 0.63, "learning_rate": 1.5906709851784768e-06, "loss": 1.2122, "step": 20911 }, { "epoch": 0.63, "learning_rate": 1.5904437770565557e-06, "loss": 1.1796, "step": 20912 }, { "epoch": 0.63, "learning_rate": 1.5902165775931727e-06, "loss": 1.1287, "step": 20913 }, { "epoch": 0.63, "learning_rate": 1.589989386790489e-06, "loss": 1.1038, "step": 20914 }, { "epoch": 0.63, "learning_rate": 1.5897622046506678e-06, "loss": 1.1021, "step": 20915 }, { "epoch": 0.63, "learning_rate": 1.5895350311758723e-06, "loss": 1.1649, "step": 20916 }, { "epoch": 0.63, "learning_rate": 1.5893078663682646e-06, "loss": 1.077, "step": 20917 }, { "epoch": 0.63, "learning_rate": 1.5890807102300085e-06, "loss": 1.1151, "step": 20918 }, { "epoch": 0.63, "learning_rate": 1.5888535627632642e-06, "loss": 1.1143, "step": 20919 }, { "epoch": 0.63, "learning_rate": 1.5886264239701953e-06, "loss": 1.1523, "step": 20920 }, { "epoch": 0.63, "learning_rate": 1.5883992938529639e-06, "loss": 1.0549, "step": 20921 }, { "epoch": 0.63, "learning_rate": 1.5881721724137328e-06, "loss": 1.1741, "step": 20922 }, { "epoch": 0.63, "learning_rate": 1.5879450596546626e-06, "loss": 1.1847, "step": 20923 }, { "epoch": 0.63, "learning_rate": 1.5877179555779165e-06, "loss": 1.1355, "step": 20924 }, { "epoch": 0.63, "learning_rate": 1.587490860185656e-06, "loss": 1.1067, "step": 20925 }, { "epoch": 0.63, "learning_rate": 1.5872637734800439e-06, "loss": 1.058, "step": 20926 }, { "epoch": 0.63, "learning_rate": 1.5870366954632402e-06, "loss": 1.1423, "step": 20927 }, { "epoch": 0.63, "learning_rate": 1.5868096261374071e-06, "loss": 1.0383, "step": 20928 }, { "epoch": 0.63, "learning_rate": 1.5865825655047073e-06, "loss": 1.1082, "step": 20929 }, { "epoch": 0.63, "learning_rate": 1.5863555135673008e-06, "loss": 1.1346, "step": 20930 }, { "epoch": 0.63, "learning_rate": 1.5861284703273514e-06, "loss": 1.1755, "step": 20931 }, { "epoch": 0.63, "learning_rate": 1.5859014357870176e-06, "loss": 1.0244, "step": 20932 }, { "epoch": 0.63, "learning_rate": 1.5856744099484617e-06, "loss": 1.1313, "step": 20933 }, { "epoch": 0.63, "learning_rate": 1.5854473928138452e-06, "loss": 1.1688, "step": 20934 }, { "epoch": 0.63, "learning_rate": 1.5852203843853298e-06, "loss": 1.181, "step": 20935 }, { "epoch": 0.63, "learning_rate": 1.584993384665075e-06, "loss": 1.0555, "step": 20936 }, { "epoch": 0.63, "learning_rate": 1.5847663936552427e-06, "loss": 1.2039, "step": 20937 }, { "epoch": 0.63, "learning_rate": 1.5845394113579931e-06, "loss": 1.1519, "step": 20938 }, { "epoch": 0.63, "learning_rate": 1.5843124377754887e-06, "loss": 1.0216, "step": 20939 }, { "epoch": 0.63, "learning_rate": 1.5840854729098881e-06, "loss": 1.0601, "step": 20940 }, { "epoch": 0.63, "learning_rate": 1.5838585167633525e-06, "loss": 1.2139, "step": 20941 }, { "epoch": 0.63, "learning_rate": 1.5836315693380422e-06, "loss": 1.1111, "step": 20942 }, { "epoch": 0.63, "learning_rate": 1.5834046306361184e-06, "loss": 1.153, "step": 20943 }, { "epoch": 0.63, "learning_rate": 1.583177700659742e-06, "loss": 1.2159, "step": 20944 }, { "epoch": 0.63, "learning_rate": 1.5829507794110716e-06, "loss": 1.1591, "step": 20945 }, { "epoch": 0.63, "learning_rate": 1.582723866892268e-06, "loss": 1.0974, "step": 20946 }, { "epoch": 0.63, "learning_rate": 1.582496963105491e-06, "loss": 1.0943, "step": 20947 }, { "epoch": 0.63, "learning_rate": 1.5822700680529018e-06, "loss": 1.1465, "step": 20948 }, { "epoch": 0.63, "learning_rate": 1.5820431817366591e-06, "loss": 1.1669, "step": 20949 }, { "epoch": 0.63, "learning_rate": 1.5818163041589232e-06, "loss": 1.1115, "step": 20950 }, { "epoch": 0.63, "learning_rate": 1.5815894353218542e-06, "loss": 1.1812, "step": 20951 }, { "epoch": 0.63, "learning_rate": 1.5813625752276118e-06, "loss": 1.1049, "step": 20952 }, { "epoch": 0.63, "learning_rate": 1.5811357238783546e-06, "loss": 0.9398, "step": 20953 }, { "epoch": 0.63, "learning_rate": 1.5809088812762428e-06, "loss": 1.2678, "step": 20954 }, { "epoch": 0.63, "learning_rate": 1.5806820474234355e-06, "loss": 1.2136, "step": 20955 }, { "epoch": 0.63, "learning_rate": 1.5804552223220927e-06, "loss": 1.1293, "step": 20956 }, { "epoch": 0.63, "learning_rate": 1.5802284059743741e-06, "loss": 1.0716, "step": 20957 }, { "epoch": 0.63, "learning_rate": 1.5800015983824375e-06, "loss": 1.1602, "step": 20958 }, { "epoch": 0.63, "learning_rate": 1.5797747995484418e-06, "loss": 1.0491, "step": 20959 }, { "epoch": 0.63, "learning_rate": 1.5795480094745475e-06, "loss": 1.11, "step": 20960 }, { "epoch": 0.63, "learning_rate": 1.5793212281629134e-06, "loss": 1.1774, "step": 20961 }, { "epoch": 0.63, "learning_rate": 1.5790944556156974e-06, "loss": 1.11, "step": 20962 }, { "epoch": 0.63, "learning_rate": 1.5788676918350583e-06, "loss": 1.1577, "step": 20963 }, { "epoch": 0.63, "learning_rate": 1.5786409368231552e-06, "loss": 1.1344, "step": 20964 }, { "epoch": 0.63, "learning_rate": 1.5784141905821471e-06, "loss": 1.0864, "step": 20965 }, { "epoch": 0.63, "learning_rate": 1.5781874531141914e-06, "loss": 1.0026, "step": 20966 }, { "epoch": 0.63, "learning_rate": 1.5779607244214474e-06, "loss": 1.2198, "step": 20967 }, { "epoch": 0.63, "learning_rate": 1.577734004506073e-06, "loss": 1.0182, "step": 20968 }, { "epoch": 0.63, "learning_rate": 1.577507293370228e-06, "loss": 1.1848, "step": 20969 }, { "epoch": 0.63, "learning_rate": 1.577280591016068e-06, "loss": 1.0487, "step": 20970 }, { "epoch": 0.63, "learning_rate": 1.5770538974457524e-06, "loss": 1.089, "step": 20971 }, { "epoch": 0.63, "learning_rate": 1.5768272126614393e-06, "loss": 1.0938, "step": 20972 }, { "epoch": 0.63, "learning_rate": 1.5766005366652865e-06, "loss": 1.1181, "step": 20973 }, { "epoch": 0.63, "learning_rate": 1.576373869459453e-06, "loss": 1.2036, "step": 20974 }, { "epoch": 0.63, "learning_rate": 1.5761472110460944e-06, "loss": 1.1845, "step": 20975 }, { "epoch": 0.63, "learning_rate": 1.5759205614273692e-06, "loss": 1.1495, "step": 20976 }, { "epoch": 0.63, "learning_rate": 1.5756939206054352e-06, "loss": 1.1151, "step": 20977 }, { "epoch": 0.63, "learning_rate": 1.5754672885824507e-06, "loss": 1.141, "step": 20978 }, { "epoch": 0.63, "learning_rate": 1.5752406653605718e-06, "loss": 1.1412, "step": 20979 }, { "epoch": 0.63, "learning_rate": 1.5750140509419562e-06, "loss": 1.3185, "step": 20980 }, { "epoch": 0.63, "learning_rate": 1.5747874453287615e-06, "loss": 1.2095, "step": 20981 }, { "epoch": 0.63, "learning_rate": 1.5745608485231455e-06, "loss": 1.1144, "step": 20982 }, { "epoch": 0.63, "learning_rate": 1.5743342605272637e-06, "loss": 1.1744, "step": 20983 }, { "epoch": 0.63, "learning_rate": 1.5741076813432738e-06, "loss": 1.1185, "step": 20984 }, { "epoch": 0.63, "learning_rate": 1.573881110973333e-06, "loss": 1.1763, "step": 20985 }, { "epoch": 0.63, "learning_rate": 1.573654549419598e-06, "loss": 1.123, "step": 20986 }, { "epoch": 0.63, "learning_rate": 1.5734279966842264e-06, "loss": 1.163, "step": 20987 }, { "epoch": 0.63, "learning_rate": 1.573201452769373e-06, "loss": 1.1205, "step": 20988 }, { "epoch": 0.63, "learning_rate": 1.5729749176771954e-06, "loss": 1.1544, "step": 20989 }, { "epoch": 0.63, "learning_rate": 1.5727483914098501e-06, "loss": 1.198, "step": 20990 }, { "epoch": 0.63, "learning_rate": 1.5725218739694942e-06, "loss": 1.0872, "step": 20991 }, { "epoch": 0.63, "learning_rate": 1.5722953653582829e-06, "loss": 1.1189, "step": 20992 }, { "epoch": 0.63, "learning_rate": 1.5720688655783727e-06, "loss": 1.2479, "step": 20993 }, { "epoch": 0.63, "learning_rate": 1.5718423746319204e-06, "loss": 1.0686, "step": 20994 }, { "epoch": 0.63, "learning_rate": 1.5716158925210823e-06, "loss": 1.0531, "step": 20995 }, { "epoch": 0.63, "learning_rate": 1.5713894192480129e-06, "loss": 1.0817, "step": 20996 }, { "epoch": 0.63, "learning_rate": 1.5711629548148687e-06, "loss": 1.132, "step": 20997 }, { "epoch": 0.63, "learning_rate": 1.5709364992238062e-06, "loss": 1.1365, "step": 20998 }, { "epoch": 0.63, "learning_rate": 1.5707100524769809e-06, "loss": 1.0616, "step": 20999 }, { "epoch": 0.63, "learning_rate": 1.570483614576549e-06, "loss": 0.9748, "step": 21000 }, { "epoch": 0.63, "learning_rate": 1.5702571855246645e-06, "loss": 1.1283, "step": 21001 }, { "epoch": 0.63, "learning_rate": 1.570030765323484e-06, "loss": 1.0892, "step": 21002 }, { "epoch": 0.63, "learning_rate": 1.5698043539751626e-06, "loss": 1.0352, "step": 21003 }, { "epoch": 0.63, "learning_rate": 1.569577951481856e-06, "loss": 1.1371, "step": 21004 }, { "epoch": 0.63, "learning_rate": 1.569351557845719e-06, "loss": 1.0471, "step": 21005 }, { "epoch": 0.63, "learning_rate": 1.5691251730689069e-06, "loss": 1.0976, "step": 21006 }, { "epoch": 0.63, "learning_rate": 1.5688987971535746e-06, "loss": 1.1419, "step": 21007 }, { "epoch": 0.63, "learning_rate": 1.5686724301018789e-06, "loss": 1.0262, "step": 21008 }, { "epoch": 0.63, "learning_rate": 1.5684460719159717e-06, "loss": 1.0452, "step": 21009 }, { "epoch": 0.63, "learning_rate": 1.5682197225980091e-06, "loss": 1.1008, "step": 21010 }, { "epoch": 0.63, "learning_rate": 1.5679933821501463e-06, "loss": 1.0916, "step": 21011 }, { "epoch": 0.63, "learning_rate": 1.5677670505745373e-06, "loss": 1.0837, "step": 21012 }, { "epoch": 0.63, "learning_rate": 1.5675407278733385e-06, "loss": 1.1556, "step": 21013 }, { "epoch": 0.63, "learning_rate": 1.5673144140487014e-06, "loss": 1.0617, "step": 21014 }, { "epoch": 0.63, "learning_rate": 1.5670881091027821e-06, "loss": 1.1069, "step": 21015 }, { "epoch": 0.63, "learning_rate": 1.5668618130377345e-06, "loss": 1.0157, "step": 21016 }, { "epoch": 0.63, "learning_rate": 1.5666355258557137e-06, "loss": 1.0734, "step": 21017 }, { "epoch": 0.63, "learning_rate": 1.5664092475588727e-06, "loss": 1.0997, "step": 21018 }, { "epoch": 0.63, "learning_rate": 1.566182978149366e-06, "loss": 1.0228, "step": 21019 }, { "epoch": 0.63, "learning_rate": 1.5659567176293477e-06, "loss": 1.1641, "step": 21020 }, { "epoch": 0.63, "learning_rate": 1.5657304660009725e-06, "loss": 1.2411, "step": 21021 }, { "epoch": 0.63, "learning_rate": 1.5655042232663921e-06, "loss": 1.1208, "step": 21022 }, { "epoch": 0.63, "learning_rate": 1.5652779894277618e-06, "loss": 1.1721, "step": 21023 }, { "epoch": 0.63, "learning_rate": 1.5650517644872345e-06, "loss": 1.0756, "step": 21024 }, { "epoch": 0.63, "learning_rate": 1.5648255484469644e-06, "loss": 1.215, "step": 21025 }, { "epoch": 0.63, "learning_rate": 1.5645993413091057e-06, "loss": 1.1627, "step": 21026 }, { "epoch": 0.63, "learning_rate": 1.5643731430758098e-06, "loss": 1.0616, "step": 21027 }, { "epoch": 0.63, "learning_rate": 1.5641469537492304e-06, "loss": 1.0146, "step": 21028 }, { "epoch": 0.63, "learning_rate": 1.563920773331522e-06, "loss": 1.1543, "step": 21029 }, { "epoch": 0.63, "learning_rate": 1.5636946018248373e-06, "loss": 1.1744, "step": 21030 }, { "epoch": 0.63, "learning_rate": 1.5634684392313282e-06, "loss": 1.1055, "step": 21031 }, { "epoch": 0.63, "learning_rate": 1.5632422855531488e-06, "loss": 1.2343, "step": 21032 }, { "epoch": 0.63, "learning_rate": 1.563016140792452e-06, "loss": 0.994, "step": 21033 }, { "epoch": 0.63, "learning_rate": 1.5627900049513906e-06, "loss": 1.072, "step": 21034 }, { "epoch": 0.63, "learning_rate": 1.5625638780321162e-06, "loss": 1.1554, "step": 21035 }, { "epoch": 0.63, "learning_rate": 1.5623377600367822e-06, "loss": 1.2567, "step": 21036 }, { "epoch": 0.63, "learning_rate": 1.5621116509675413e-06, "loss": 1.0911, "step": 21037 }, { "epoch": 0.63, "learning_rate": 1.5618855508265457e-06, "loss": 1.2721, "step": 21038 }, { "epoch": 0.63, "learning_rate": 1.561659459615949e-06, "loss": 1.1462, "step": 21039 }, { "epoch": 0.63, "learning_rate": 1.561433377337901e-06, "loss": 1.1715, "step": 21040 }, { "epoch": 0.63, "learning_rate": 1.5612073039945553e-06, "loss": 1.2261, "step": 21041 }, { "epoch": 0.63, "learning_rate": 1.560981239588064e-06, "loss": 1.1224, "step": 21042 }, { "epoch": 0.63, "learning_rate": 1.5607551841205798e-06, "loss": 1.0969, "step": 21043 }, { "epoch": 0.63, "learning_rate": 1.5605291375942536e-06, "loss": 1.0197, "step": 21044 }, { "epoch": 0.63, "learning_rate": 1.560303100011237e-06, "loss": 1.1096, "step": 21045 }, { "epoch": 0.63, "learning_rate": 1.5600770713736824e-06, "loss": 1.0578, "step": 21046 }, { "epoch": 0.63, "learning_rate": 1.5598510516837418e-06, "loss": 1.0981, "step": 21047 }, { "epoch": 0.63, "learning_rate": 1.5596250409435662e-06, "loss": 1.1197, "step": 21048 }, { "epoch": 0.63, "learning_rate": 1.5593990391553072e-06, "loss": 1.1752, "step": 21049 }, { "epoch": 0.63, "learning_rate": 1.559173046321116e-06, "loss": 1.1948, "step": 21050 }, { "epoch": 0.63, "learning_rate": 1.5589470624431446e-06, "loss": 1.0805, "step": 21051 }, { "epoch": 0.63, "learning_rate": 1.5587210875235449e-06, "loss": 1.1268, "step": 21052 }, { "epoch": 0.63, "learning_rate": 1.5584951215644661e-06, "loss": 1.0688, "step": 21053 }, { "epoch": 0.63, "learning_rate": 1.5582691645680602e-06, "loss": 1.1136, "step": 21054 }, { "epoch": 0.63, "learning_rate": 1.5580432165364783e-06, "loss": 1.044, "step": 21055 }, { "epoch": 0.63, "learning_rate": 1.5578172774718726e-06, "loss": 1.1325, "step": 21056 }, { "epoch": 0.63, "learning_rate": 1.5575913473763916e-06, "loss": 1.0808, "step": 21057 }, { "epoch": 0.63, "learning_rate": 1.5573654262521868e-06, "loss": 1.0441, "step": 21058 }, { "epoch": 0.63, "learning_rate": 1.5571395141014092e-06, "loss": 1.0684, "step": 21059 }, { "epoch": 0.63, "learning_rate": 1.55691361092621e-06, "loss": 1.126, "step": 21060 }, { "epoch": 0.63, "learning_rate": 1.5566877167287386e-06, "loss": 1.1588, "step": 21061 }, { "epoch": 0.63, "learning_rate": 1.5564618315111458e-06, "loss": 1.1375, "step": 21062 }, { "epoch": 0.63, "learning_rate": 1.5562359552755814e-06, "loss": 1.1273, "step": 21063 }, { "epoch": 0.63, "learning_rate": 1.5560100880241967e-06, "loss": 1.0529, "step": 21064 }, { "epoch": 0.63, "learning_rate": 1.5557842297591421e-06, "loss": 1.1273, "step": 21065 }, { "epoch": 0.63, "learning_rate": 1.555558380482566e-06, "loss": 1.1429, "step": 21066 }, { "epoch": 0.63, "learning_rate": 1.5553325401966193e-06, "loss": 1.054, "step": 21067 }, { "epoch": 0.63, "learning_rate": 1.5551067089034518e-06, "loss": 1.1755, "step": 21068 }, { "epoch": 0.63, "learning_rate": 1.5548808866052146e-06, "loss": 1.1118, "step": 21069 }, { "epoch": 0.63, "learning_rate": 1.5546550733040546e-06, "loss": 1.0911, "step": 21070 }, { "epoch": 0.63, "learning_rate": 1.5544292690021234e-06, "loss": 1.1147, "step": 21071 }, { "epoch": 0.63, "learning_rate": 1.5542034737015702e-06, "loss": 1.0753, "step": 21072 }, { "epoch": 0.63, "learning_rate": 1.5539776874045448e-06, "loss": 1.1021, "step": 21073 }, { "epoch": 0.63, "learning_rate": 1.5537519101131957e-06, "loss": 1.189, "step": 21074 }, { "epoch": 0.63, "learning_rate": 1.5535261418296727e-06, "loss": 1.1917, "step": 21075 }, { "epoch": 0.63, "learning_rate": 1.553300382556125e-06, "loss": 1.0444, "step": 21076 }, { "epoch": 0.63, "learning_rate": 1.5530746322947015e-06, "loss": 1.0624, "step": 21077 }, { "epoch": 0.63, "learning_rate": 1.5528488910475528e-06, "loss": 1.0218, "step": 21078 }, { "epoch": 0.64, "learning_rate": 1.5526231588168253e-06, "loss": 1.1838, "step": 21079 }, { "epoch": 0.64, "learning_rate": 1.552397435604669e-06, "loss": 1.0865, "step": 21080 }, { "epoch": 0.64, "learning_rate": 1.5521717214132328e-06, "loss": 1.168, "step": 21081 }, { "epoch": 0.64, "learning_rate": 1.5519460162446665e-06, "loss": 1.0704, "step": 21082 }, { "epoch": 0.64, "learning_rate": 1.5517203201011164e-06, "loss": 0.9963, "step": 21083 }, { "epoch": 0.64, "learning_rate": 1.5514946329847318e-06, "loss": 1.1591, "step": 21084 }, { "epoch": 0.64, "learning_rate": 1.551268954897662e-06, "loss": 1.0641, "step": 21085 }, { "epoch": 0.64, "learning_rate": 1.5510432858420552e-06, "loss": 1.0937, "step": 21086 }, { "epoch": 0.64, "learning_rate": 1.5508176258200585e-06, "loss": 1.0924, "step": 21087 }, { "epoch": 0.64, "learning_rate": 1.550591974833821e-06, "loss": 1.1202, "step": 21088 }, { "epoch": 0.64, "learning_rate": 1.5503663328854909e-06, "loss": 1.1232, "step": 21089 }, { "epoch": 0.64, "learning_rate": 1.5501406999772157e-06, "loss": 1.0344, "step": 21090 }, { "epoch": 0.64, "learning_rate": 1.5499150761111447e-06, "loss": 1.2241, "step": 21091 }, { "epoch": 0.64, "learning_rate": 1.5496894612894237e-06, "loss": 1.0379, "step": 21092 }, { "epoch": 0.64, "learning_rate": 1.549463855514201e-06, "loss": 1.1333, "step": 21093 }, { "epoch": 0.64, "learning_rate": 1.5492382587876248e-06, "loss": 1.1172, "step": 21094 }, { "epoch": 0.64, "learning_rate": 1.5490126711118435e-06, "loss": 1.0446, "step": 21095 }, { "epoch": 0.64, "learning_rate": 1.5487870924890026e-06, "loss": 1.1646, "step": 21096 }, { "epoch": 0.64, "learning_rate": 1.5485615229212502e-06, "loss": 1.1043, "step": 21097 }, { "epoch": 0.64, "learning_rate": 1.5483359624107342e-06, "loss": 1.1377, "step": 21098 }, { "epoch": 0.64, "learning_rate": 1.5481104109596018e-06, "loss": 1.2593, "step": 21099 }, { "epoch": 0.64, "learning_rate": 1.5478848685699994e-06, "loss": 1.1187, "step": 21100 }, { "epoch": 0.64, "learning_rate": 1.5476593352440744e-06, "loss": 1.1731, "step": 21101 }, { "epoch": 0.64, "learning_rate": 1.547433810983974e-06, "loss": 0.9746, "step": 21102 }, { "epoch": 0.64, "learning_rate": 1.547208295791845e-06, "loss": 1.0703, "step": 21103 }, { "epoch": 0.64, "learning_rate": 1.5469827896698348e-06, "loss": 1.0991, "step": 21104 }, { "epoch": 0.64, "learning_rate": 1.546757292620089e-06, "loss": 1.1459, "step": 21105 }, { "epoch": 0.64, "learning_rate": 1.5465318046447542e-06, "loss": 1.1173, "step": 21106 }, { "epoch": 0.64, "learning_rate": 1.5463063257459776e-06, "loss": 1.027, "step": 21107 }, { "epoch": 0.64, "learning_rate": 1.5460808559259063e-06, "loss": 1.116, "step": 21108 }, { "epoch": 0.64, "learning_rate": 1.545855395186685e-06, "loss": 1.1266, "step": 21109 }, { "epoch": 0.64, "learning_rate": 1.545629943530461e-06, "loss": 1.0853, "step": 21110 }, { "epoch": 0.64, "learning_rate": 1.5454045009593799e-06, "loss": 1.1507, "step": 21111 }, { "epoch": 0.64, "learning_rate": 1.545179067475589e-06, "loss": 1.0987, "step": 21112 }, { "epoch": 0.64, "learning_rate": 1.544953643081233e-06, "loss": 1.1865, "step": 21113 }, { "epoch": 0.64, "learning_rate": 1.544728227778458e-06, "loss": 1.1477, "step": 21114 }, { "epoch": 0.64, "learning_rate": 1.544502821569411e-06, "loss": 1.0167, "step": 21115 }, { "epoch": 0.64, "learning_rate": 1.5442774244562363e-06, "loss": 1.1144, "step": 21116 }, { "epoch": 0.64, "learning_rate": 1.544052036441081e-06, "loss": 1.0677, "step": 21117 }, { "epoch": 0.64, "learning_rate": 1.5438266575260892e-06, "loss": 1.0608, "step": 21118 }, { "epoch": 0.64, "learning_rate": 1.5436012877134072e-06, "loss": 1.1541, "step": 21119 }, { "epoch": 0.64, "learning_rate": 1.5433759270051802e-06, "loss": 1.1154, "step": 21120 }, { "epoch": 0.64, "learning_rate": 1.5431505754035547e-06, "loss": 1.1252, "step": 21121 }, { "epoch": 0.64, "learning_rate": 1.5429252329106743e-06, "loss": 1.1479, "step": 21122 }, { "epoch": 0.64, "learning_rate": 1.542699899528684e-06, "loss": 1.0854, "step": 21123 }, { "epoch": 0.64, "learning_rate": 1.54247457525973e-06, "loss": 1.2039, "step": 21124 }, { "epoch": 0.64, "learning_rate": 1.5422492601059575e-06, "loss": 1.0754, "step": 21125 }, { "epoch": 0.64, "learning_rate": 1.5420239540695104e-06, "loss": 1.0243, "step": 21126 }, { "epoch": 0.64, "learning_rate": 1.5417986571525336e-06, "loss": 1.0276, "step": 21127 }, { "epoch": 0.64, "learning_rate": 1.5415733693571722e-06, "loss": 1.1554, "step": 21128 }, { "epoch": 0.64, "learning_rate": 1.5413480906855704e-06, "loss": 1.204, "step": 21129 }, { "epoch": 0.64, "learning_rate": 1.541122821139874e-06, "loss": 1.1323, "step": 21130 }, { "epoch": 0.64, "learning_rate": 1.540897560722226e-06, "loss": 1.0614, "step": 21131 }, { "epoch": 0.64, "learning_rate": 1.540672309434771e-06, "loss": 1.1507, "step": 21132 }, { "epoch": 0.64, "learning_rate": 1.5404470672796537e-06, "loss": 1.1849, "step": 21133 }, { "epoch": 0.64, "learning_rate": 1.5402218342590192e-06, "loss": 1.0086, "step": 21134 }, { "epoch": 0.64, "learning_rate": 1.5399966103750097e-06, "loss": 1.2108, "step": 21135 }, { "epoch": 0.64, "learning_rate": 1.53977139562977e-06, "loss": 1.0177, "step": 21136 }, { "epoch": 0.64, "learning_rate": 1.5395461900254441e-06, "loss": 1.2343, "step": 21137 }, { "epoch": 0.64, "learning_rate": 1.539320993564177e-06, "loss": 1.0784, "step": 21138 }, { "epoch": 0.64, "learning_rate": 1.5390958062481104e-06, "loss": 1.0416, "step": 21139 }, { "epoch": 0.64, "learning_rate": 1.5388706280793888e-06, "loss": 1.1097, "step": 21140 }, { "epoch": 0.64, "learning_rate": 1.538645459060156e-06, "loss": 1.1667, "step": 21141 }, { "epoch": 0.64, "learning_rate": 1.5384202991925554e-06, "loss": 1.0802, "step": 21142 }, { "epoch": 0.64, "learning_rate": 1.538195148478731e-06, "loss": 0.9866, "step": 21143 }, { "epoch": 0.64, "learning_rate": 1.537970006920825e-06, "loss": 1.1005, "step": 21144 }, { "epoch": 0.64, "learning_rate": 1.537744874520981e-06, "loss": 1.092, "step": 21145 }, { "epoch": 0.64, "learning_rate": 1.5375197512813427e-06, "loss": 1.0916, "step": 21146 }, { "epoch": 0.64, "learning_rate": 1.5372946372040536e-06, "loss": 0.9981, "step": 21147 }, { "epoch": 0.64, "learning_rate": 1.5370695322912551e-06, "loss": 1.1993, "step": 21148 }, { "epoch": 0.64, "learning_rate": 1.5368444365450908e-06, "loss": 1.1683, "step": 21149 }, { "epoch": 0.64, "learning_rate": 1.5366193499677038e-06, "loss": 0.975, "step": 21150 }, { "epoch": 0.64, "learning_rate": 1.5363942725612375e-06, "loss": 1.1731, "step": 21151 }, { "epoch": 0.64, "learning_rate": 1.5361692043278323e-06, "loss": 1.0912, "step": 21152 }, { "epoch": 0.64, "learning_rate": 1.5359441452696321e-06, "loss": 1.0897, "step": 21153 }, { "epoch": 0.64, "learning_rate": 1.5357190953887795e-06, "loss": 1.1607, "step": 21154 }, { "epoch": 0.64, "learning_rate": 1.5354940546874176e-06, "loss": 1.1505, "step": 21155 }, { "epoch": 0.64, "learning_rate": 1.535269023167687e-06, "loss": 1.1066, "step": 21156 }, { "epoch": 0.64, "learning_rate": 1.5350440008317303e-06, "loss": 0.9783, "step": 21157 }, { "epoch": 0.64, "learning_rate": 1.5348189876816905e-06, "loss": 1.0876, "step": 21158 }, { "epoch": 0.64, "learning_rate": 1.5345939837197088e-06, "loss": 1.1224, "step": 21159 }, { "epoch": 0.64, "learning_rate": 1.5343689889479286e-06, "loss": 1.1141, "step": 21160 }, { "epoch": 0.64, "learning_rate": 1.534144003368489e-06, "loss": 1.1471, "step": 21161 }, { "epoch": 0.64, "learning_rate": 1.533919026983534e-06, "loss": 1.1537, "step": 21162 }, { "epoch": 0.64, "learning_rate": 1.5336940597952045e-06, "loss": 1.0537, "step": 21163 }, { "epoch": 0.64, "learning_rate": 1.5334691018056427e-06, "loss": 1.063, "step": 21164 }, { "epoch": 0.64, "learning_rate": 1.533244153016989e-06, "loss": 1.0515, "step": 21165 }, { "epoch": 0.64, "learning_rate": 1.533019213431385e-06, "loss": 1.0581, "step": 21166 }, { "epoch": 0.64, "learning_rate": 1.5327942830509728e-06, "loss": 1.2468, "step": 21167 }, { "epoch": 0.64, "learning_rate": 1.5325693618778934e-06, "loss": 1.095, "step": 21168 }, { "epoch": 0.64, "learning_rate": 1.5323444499142873e-06, "loss": 1.0906, "step": 21169 }, { "epoch": 0.64, "learning_rate": 1.532119547162296e-06, "loss": 1.0199, "step": 21170 }, { "epoch": 0.64, "learning_rate": 1.5318946536240603e-06, "loss": 1.1376, "step": 21171 }, { "epoch": 0.64, "learning_rate": 1.5316697693017216e-06, "loss": 1.0542, "step": 21172 }, { "epoch": 0.64, "learning_rate": 1.5314448941974214e-06, "loss": 1.1357, "step": 21173 }, { "epoch": 0.64, "learning_rate": 1.5312200283132977e-06, "loss": 1.0705, "step": 21174 }, { "epoch": 0.64, "learning_rate": 1.530995171651493e-06, "loss": 1.1627, "step": 21175 }, { "epoch": 0.64, "learning_rate": 1.530770324214148e-06, "loss": 1.1562, "step": 21176 }, { "epoch": 0.64, "learning_rate": 1.5305454860034036e-06, "loss": 1.1921, "step": 21177 }, { "epoch": 0.64, "learning_rate": 1.530320657021398e-06, "loss": 1.0984, "step": 21178 }, { "epoch": 0.64, "learning_rate": 1.530095837270273e-06, "loss": 1.2198, "step": 21179 }, { "epoch": 0.64, "learning_rate": 1.5298710267521683e-06, "loss": 1.0974, "step": 21180 }, { "epoch": 0.64, "learning_rate": 1.5296462254692245e-06, "loss": 1.2466, "step": 21181 }, { "epoch": 0.64, "learning_rate": 1.5294214334235813e-06, "loss": 1.1121, "step": 21182 }, { "epoch": 0.64, "learning_rate": 1.5291966506173784e-06, "loss": 1.11, "step": 21183 }, { "epoch": 0.64, "learning_rate": 1.5289718770527556e-06, "loss": 1.1357, "step": 21184 }, { "epoch": 0.64, "learning_rate": 1.528747112731853e-06, "loss": 1.1635, "step": 21185 }, { "epoch": 0.64, "learning_rate": 1.5285223576568111e-06, "loss": 1.0782, "step": 21186 }, { "epoch": 0.64, "learning_rate": 1.5282976118297676e-06, "loss": 1.1296, "step": 21187 }, { "epoch": 0.64, "learning_rate": 1.5280728752528628e-06, "loss": 1.0533, "step": 21188 }, { "epoch": 0.64, "learning_rate": 1.527848147928236e-06, "loss": 1.1323, "step": 21189 }, { "epoch": 0.64, "learning_rate": 1.5276234298580278e-06, "loss": 1.059, "step": 21190 }, { "epoch": 0.64, "learning_rate": 1.5273987210443753e-06, "loss": 1.1218, "step": 21191 }, { "epoch": 0.64, "learning_rate": 1.5271740214894182e-06, "loss": 1.2083, "step": 21192 }, { "epoch": 0.64, "learning_rate": 1.5269493311952962e-06, "loss": 1.2083, "step": 21193 }, { "epoch": 0.64, "learning_rate": 1.5267246501641484e-06, "loss": 1.0804, "step": 21194 }, { "epoch": 0.64, "learning_rate": 1.5264999783981127e-06, "loss": 1.1136, "step": 21195 }, { "epoch": 0.64, "learning_rate": 1.5262753158993282e-06, "loss": 1.1373, "step": 21196 }, { "epoch": 0.64, "learning_rate": 1.5260506626699339e-06, "loss": 1.0634, "step": 21197 }, { "epoch": 0.64, "learning_rate": 1.5258260187120686e-06, "loss": 1.1578, "step": 21198 }, { "epoch": 0.64, "learning_rate": 1.5256013840278706e-06, "loss": 0.9919, "step": 21199 }, { "epoch": 0.64, "learning_rate": 1.5253767586194773e-06, "loss": 1.1544, "step": 21200 }, { "epoch": 0.64, "learning_rate": 1.5251521424890282e-06, "loss": 1.1774, "step": 21201 }, { "epoch": 0.64, "learning_rate": 1.5249275356386608e-06, "loss": 0.9694, "step": 21202 }, { "epoch": 0.64, "learning_rate": 1.524702938070515e-06, "loss": 1.0739, "step": 21203 }, { "epoch": 0.64, "learning_rate": 1.5244783497867266e-06, "loss": 1.0325, "step": 21204 }, { "epoch": 0.64, "learning_rate": 1.5242537707894338e-06, "loss": 1.1222, "step": 21205 }, { "epoch": 0.64, "learning_rate": 1.5240292010807761e-06, "loss": 1.1163, "step": 21206 }, { "epoch": 0.64, "learning_rate": 1.5238046406628903e-06, "loss": 1.1035, "step": 21207 }, { "epoch": 0.64, "learning_rate": 1.5235800895379138e-06, "loss": 1.0787, "step": 21208 }, { "epoch": 0.64, "learning_rate": 1.523355547707985e-06, "loss": 1.1546, "step": 21209 }, { "epoch": 0.64, "learning_rate": 1.5231310151752408e-06, "loss": 1.1053, "step": 21210 }, { "epoch": 0.64, "learning_rate": 1.5229064919418185e-06, "loss": 1.0997, "step": 21211 }, { "epoch": 0.64, "learning_rate": 1.5226819780098564e-06, "loss": 1.1917, "step": 21212 }, { "epoch": 0.64, "learning_rate": 1.522457473381491e-06, "loss": 1.2139, "step": 21213 }, { "epoch": 0.64, "learning_rate": 1.5222329780588593e-06, "loss": 1.0984, "step": 21214 }, { "epoch": 0.64, "learning_rate": 1.5220084920440985e-06, "loss": 1.0688, "step": 21215 }, { "epoch": 0.64, "learning_rate": 1.5217840153393476e-06, "loss": 1.0344, "step": 21216 }, { "epoch": 0.64, "learning_rate": 1.5215595479467404e-06, "loss": 1.2052, "step": 21217 }, { "epoch": 0.64, "learning_rate": 1.5213350898684149e-06, "loss": 1.1208, "step": 21218 }, { "epoch": 0.64, "learning_rate": 1.521110641106508e-06, "loss": 1.0996, "step": 21219 }, { "epoch": 0.64, "learning_rate": 1.5208862016631575e-06, "loss": 0.9837, "step": 21220 }, { "epoch": 0.64, "learning_rate": 1.520661771540498e-06, "loss": 1.1033, "step": 21221 }, { "epoch": 0.64, "learning_rate": 1.5204373507406662e-06, "loss": 1.0833, "step": 21222 }, { "epoch": 0.64, "learning_rate": 1.5202129392657995e-06, "loss": 1.1212, "step": 21223 }, { "epoch": 0.64, "learning_rate": 1.5199885371180335e-06, "loss": 1.2449, "step": 21224 }, { "epoch": 0.64, "learning_rate": 1.5197641442995053e-06, "loss": 1.0748, "step": 21225 }, { "epoch": 0.64, "learning_rate": 1.5195397608123497e-06, "loss": 1.1514, "step": 21226 }, { "epoch": 0.64, "learning_rate": 1.5193153866587036e-06, "loss": 1.0645, "step": 21227 }, { "epoch": 0.64, "learning_rate": 1.5190910218407024e-06, "loss": 1.1279, "step": 21228 }, { "epoch": 0.64, "learning_rate": 1.5188666663604834e-06, "loss": 1.1682, "step": 21229 }, { "epoch": 0.64, "learning_rate": 1.5186423202201804e-06, "loss": 1.1234, "step": 21230 }, { "epoch": 0.64, "learning_rate": 1.5184179834219298e-06, "loss": 1.0197, "step": 21231 }, { "epoch": 0.64, "learning_rate": 1.518193655967867e-06, "loss": 1.0831, "step": 21232 }, { "epoch": 0.64, "learning_rate": 1.517969337860129e-06, "loss": 1.1075, "step": 21233 }, { "epoch": 0.64, "learning_rate": 1.5177450291008489e-06, "loss": 1.0753, "step": 21234 }, { "epoch": 0.64, "learning_rate": 1.517520729692163e-06, "loss": 1.1028, "step": 21235 }, { "epoch": 0.64, "learning_rate": 1.5172964396362064e-06, "loss": 1.1035, "step": 21236 }, { "epoch": 0.64, "learning_rate": 1.5170721589351145e-06, "loss": 1.1998, "step": 21237 }, { "epoch": 0.64, "learning_rate": 1.5168478875910232e-06, "loss": 1.0592, "step": 21238 }, { "epoch": 0.64, "learning_rate": 1.5166236256060655e-06, "loss": 1.0862, "step": 21239 }, { "epoch": 0.64, "learning_rate": 1.5163993729823772e-06, "loss": 1.1028, "step": 21240 }, { "epoch": 0.64, "learning_rate": 1.5161751297220933e-06, "loss": 1.1788, "step": 21241 }, { "epoch": 0.64, "learning_rate": 1.5159508958273494e-06, "loss": 1.0892, "step": 21242 }, { "epoch": 0.64, "learning_rate": 1.5157266713002783e-06, "loss": 1.1074, "step": 21243 }, { "epoch": 0.64, "learning_rate": 1.515502456143015e-06, "loss": 1.0554, "step": 21244 }, { "epoch": 0.64, "learning_rate": 1.515278250357694e-06, "loss": 1.2158, "step": 21245 }, { "epoch": 0.64, "learning_rate": 1.5150540539464509e-06, "loss": 1.1207, "step": 21246 }, { "epoch": 0.64, "learning_rate": 1.514829866911418e-06, "loss": 1.121, "step": 21247 }, { "epoch": 0.64, "learning_rate": 1.51460568925473e-06, "loss": 1.1808, "step": 21248 }, { "epoch": 0.64, "learning_rate": 1.5143815209785214e-06, "loss": 1.1337, "step": 21249 }, { "epoch": 0.64, "learning_rate": 1.5141573620849262e-06, "loss": 1.1037, "step": 21250 }, { "epoch": 0.64, "learning_rate": 1.5139332125760786e-06, "loss": 1.127, "step": 21251 }, { "epoch": 0.64, "learning_rate": 1.5137090724541112e-06, "loss": 1.1252, "step": 21252 }, { "epoch": 0.64, "learning_rate": 1.5134849417211582e-06, "loss": 1.1407, "step": 21253 }, { "epoch": 0.64, "learning_rate": 1.5132608203793542e-06, "loss": 1.0346, "step": 21254 }, { "epoch": 0.64, "learning_rate": 1.5130367084308322e-06, "loss": 1.2255, "step": 21255 }, { "epoch": 0.64, "learning_rate": 1.5128126058777248e-06, "loss": 1.2271, "step": 21256 }, { "epoch": 0.64, "learning_rate": 1.5125885127221656e-06, "loss": 1.1154, "step": 21257 }, { "epoch": 0.64, "learning_rate": 1.5123644289662887e-06, "loss": 1.0679, "step": 21258 }, { "epoch": 0.64, "learning_rate": 1.5121403546122277e-06, "loss": 1.112, "step": 21259 }, { "epoch": 0.64, "learning_rate": 1.5119162896621134e-06, "loss": 1.0707, "step": 21260 }, { "epoch": 0.64, "learning_rate": 1.5116922341180803e-06, "loss": 1.0802, "step": 21261 }, { "epoch": 0.64, "learning_rate": 1.5114681879822613e-06, "loss": 1.1715, "step": 21262 }, { "epoch": 0.64, "learning_rate": 1.5112441512567888e-06, "loss": 1.0406, "step": 21263 }, { "epoch": 0.64, "learning_rate": 1.5110201239437966e-06, "loss": 1.0899, "step": 21264 }, { "epoch": 0.64, "learning_rate": 1.5107961060454156e-06, "loss": 1.0637, "step": 21265 }, { "epoch": 0.64, "learning_rate": 1.5105720975637795e-06, "loss": 1.161, "step": 21266 }, { "epoch": 0.64, "learning_rate": 1.5103480985010206e-06, "loss": 1.0092, "step": 21267 }, { "epoch": 0.64, "learning_rate": 1.5101241088592719e-06, "loss": 1.1269, "step": 21268 }, { "epoch": 0.64, "learning_rate": 1.509900128640664e-06, "loss": 1.2189, "step": 21269 }, { "epoch": 0.64, "learning_rate": 1.5096761578473302e-06, "loss": 1.1653, "step": 21270 }, { "epoch": 0.64, "learning_rate": 1.5094521964814024e-06, "loss": 1.077, "step": 21271 }, { "epoch": 0.64, "learning_rate": 1.5092282445450135e-06, "loss": 1.0401, "step": 21272 }, { "epoch": 0.64, "learning_rate": 1.5090043020402936e-06, "loss": 1.1394, "step": 21273 }, { "epoch": 0.64, "learning_rate": 1.5087803689693752e-06, "loss": 1.2209, "step": 21274 }, { "epoch": 0.64, "learning_rate": 1.508556445334391e-06, "loss": 1.1524, "step": 21275 }, { "epoch": 0.64, "learning_rate": 1.5083325311374713e-06, "loss": 1.0193, "step": 21276 }, { "epoch": 0.64, "learning_rate": 1.5081086263807491e-06, "loss": 0.9824, "step": 21277 }, { "epoch": 0.64, "learning_rate": 1.5078847310663544e-06, "loss": 1.0951, "step": 21278 }, { "epoch": 0.64, "learning_rate": 1.5076608451964192e-06, "loss": 1.0339, "step": 21279 }, { "epoch": 0.64, "learning_rate": 1.5074369687730756e-06, "loss": 1.2064, "step": 21280 }, { "epoch": 0.64, "learning_rate": 1.5072131017984536e-06, "loss": 0.9741, "step": 21281 }, { "epoch": 0.64, "learning_rate": 1.5069892442746848e-06, "loss": 1.0078, "step": 21282 }, { "epoch": 0.64, "learning_rate": 1.5067653962038996e-06, "loss": 1.0571, "step": 21283 }, { "epoch": 0.64, "learning_rate": 1.5065415575882296e-06, "loss": 1.033, "step": 21284 }, { "epoch": 0.64, "learning_rate": 1.506317728429807e-06, "loss": 1.0651, "step": 21285 }, { "epoch": 0.64, "learning_rate": 1.5060939087307597e-06, "loss": 1.1271, "step": 21286 }, { "epoch": 0.64, "learning_rate": 1.5058700984932195e-06, "loss": 1.1812, "step": 21287 }, { "epoch": 0.64, "learning_rate": 1.5056462977193177e-06, "loss": 1.1525, "step": 21288 }, { "epoch": 0.64, "learning_rate": 1.5054225064111836e-06, "loss": 1.0059, "step": 21289 }, { "epoch": 0.64, "learning_rate": 1.505198724570949e-06, "loss": 1.1198, "step": 21290 }, { "epoch": 0.64, "learning_rate": 1.5049749522007434e-06, "loss": 1.0197, "step": 21291 }, { "epoch": 0.64, "learning_rate": 1.5047511893026968e-06, "loss": 1.1312, "step": 21292 }, { "epoch": 0.64, "learning_rate": 1.504527435878939e-06, "loss": 1.0737, "step": 21293 }, { "epoch": 0.64, "learning_rate": 1.5043036919316017e-06, "loss": 1.0464, "step": 21294 }, { "epoch": 0.64, "learning_rate": 1.5040799574628128e-06, "loss": 1.1161, "step": 21295 }, { "epoch": 0.64, "learning_rate": 1.503856232474703e-06, "loss": 1.0585, "step": 21296 }, { "epoch": 0.64, "learning_rate": 1.5036325169694026e-06, "loss": 0.9945, "step": 21297 }, { "epoch": 0.64, "learning_rate": 1.5034088109490414e-06, "loss": 1.0881, "step": 21298 }, { "epoch": 0.64, "learning_rate": 1.5031851144157471e-06, "loss": 1.2097, "step": 21299 }, { "epoch": 0.64, "learning_rate": 1.502961427371651e-06, "loss": 1.1066, "step": 21300 }, { "epoch": 0.64, "learning_rate": 1.5027377498188817e-06, "loss": 1.0789, "step": 21301 }, { "epoch": 0.64, "learning_rate": 1.5025140817595685e-06, "loss": 1.0663, "step": 21302 }, { "epoch": 0.64, "learning_rate": 1.5022904231958422e-06, "loss": 1.1302, "step": 21303 }, { "epoch": 0.64, "learning_rate": 1.5020667741298296e-06, "loss": 1.1262, "step": 21304 }, { "epoch": 0.64, "learning_rate": 1.5018431345636603e-06, "loss": 1.1552, "step": 21305 }, { "epoch": 0.64, "learning_rate": 1.5016195044994635e-06, "loss": 1.1861, "step": 21306 }, { "epoch": 0.64, "learning_rate": 1.5013958839393692e-06, "loss": 1.0374, "step": 21307 }, { "epoch": 0.64, "learning_rate": 1.5011722728855045e-06, "loss": 1.048, "step": 21308 }, { "epoch": 0.64, "learning_rate": 1.5009486713399983e-06, "loss": 1.0649, "step": 21309 }, { "epoch": 0.64, "learning_rate": 1.5007250793049798e-06, "loss": 0.9479, "step": 21310 }, { "epoch": 0.64, "learning_rate": 1.5005014967825788e-06, "loss": 1.0634, "step": 21311 }, { "epoch": 0.64, "learning_rate": 1.5002779237749205e-06, "loss": 1.1839, "step": 21312 }, { "epoch": 0.64, "learning_rate": 1.5000543602841352e-06, "loss": 1.2231, "step": 21313 }, { "epoch": 0.64, "learning_rate": 1.4998308063123508e-06, "loss": 1.2217, "step": 21314 }, { "epoch": 0.64, "learning_rate": 1.4996072618616953e-06, "loss": 1.0834, "step": 21315 }, { "epoch": 0.64, "learning_rate": 1.4993837269342981e-06, "loss": 1.0896, "step": 21316 }, { "epoch": 0.64, "learning_rate": 1.4991602015322847e-06, "loss": 1.1339, "step": 21317 }, { "epoch": 0.64, "learning_rate": 1.4989366856577841e-06, "loss": 1.1196, "step": 21318 }, { "epoch": 0.64, "learning_rate": 1.4987131793129245e-06, "loss": 1.1169, "step": 21319 }, { "epoch": 0.64, "learning_rate": 1.4984896824998333e-06, "loss": 1.0856, "step": 21320 }, { "epoch": 0.64, "learning_rate": 1.4982661952206373e-06, "loss": 1.14, "step": 21321 }, { "epoch": 0.64, "learning_rate": 1.4980427174774654e-06, "loss": 1.0959, "step": 21322 }, { "epoch": 0.64, "learning_rate": 1.4978192492724436e-06, "loss": 1.2128, "step": 21323 }, { "epoch": 0.64, "learning_rate": 1.497595790607701e-06, "loss": 1.1446, "step": 21324 }, { "epoch": 0.64, "learning_rate": 1.497372341485363e-06, "loss": 1.2662, "step": 21325 }, { "epoch": 0.64, "learning_rate": 1.4971489019075571e-06, "loss": 1.0538, "step": 21326 }, { "epoch": 0.64, "learning_rate": 1.496925471876411e-06, "loss": 1.1836, "step": 21327 }, { "epoch": 0.64, "learning_rate": 1.4967020513940521e-06, "loss": 1.092, "step": 21328 }, { "epoch": 0.64, "learning_rate": 1.4964786404626054e-06, "loss": 1.0677, "step": 21329 }, { "epoch": 0.64, "learning_rate": 1.4962552390841988e-06, "loss": 1.0384, "step": 21330 }, { "epoch": 0.64, "learning_rate": 1.496031847260959e-06, "loss": 1.0594, "step": 21331 }, { "epoch": 0.64, "learning_rate": 1.4958084649950123e-06, "loss": 1.0198, "step": 21332 }, { "epoch": 0.64, "learning_rate": 1.495585092288486e-06, "loss": 1.0557, "step": 21333 }, { "epoch": 0.64, "learning_rate": 1.4953617291435053e-06, "loss": 1.0399, "step": 21334 }, { "epoch": 0.64, "learning_rate": 1.4951383755621972e-06, "loss": 1.1156, "step": 21335 }, { "epoch": 0.64, "learning_rate": 1.4949150315466876e-06, "loss": 1.082, "step": 21336 }, { "epoch": 0.64, "learning_rate": 1.4946916970991042e-06, "loss": 1.2517, "step": 21337 }, { "epoch": 0.64, "learning_rate": 1.4944683722215704e-06, "loss": 1.1732, "step": 21338 }, { "epoch": 0.64, "learning_rate": 1.4942450569162137e-06, "loss": 1.1021, "step": 21339 }, { "epoch": 0.64, "learning_rate": 1.4940217511851593e-06, "loss": 1.1363, "step": 21340 }, { "epoch": 0.64, "learning_rate": 1.4937984550305345e-06, "loss": 1.0841, "step": 21341 }, { "epoch": 0.64, "learning_rate": 1.4935751684544627e-06, "loss": 1.0851, "step": 21342 }, { "epoch": 0.64, "learning_rate": 1.4933518914590705e-06, "loss": 1.1407, "step": 21343 }, { "epoch": 0.64, "learning_rate": 1.4931286240464837e-06, "loss": 1.0909, "step": 21344 }, { "epoch": 0.64, "learning_rate": 1.4929053662188275e-06, "loss": 1.0966, "step": 21345 }, { "epoch": 0.64, "learning_rate": 1.4926821179782277e-06, "loss": 1.0615, "step": 21346 }, { "epoch": 0.64, "learning_rate": 1.4924588793268085e-06, "loss": 1.1802, "step": 21347 }, { "epoch": 0.64, "learning_rate": 1.4922356502666951e-06, "loss": 1.1042, "step": 21348 }, { "epoch": 0.64, "learning_rate": 1.4920124308000134e-06, "loss": 1.1071, "step": 21349 }, { "epoch": 0.64, "learning_rate": 1.4917892209288886e-06, "loss": 1.1094, "step": 21350 }, { "epoch": 0.64, "learning_rate": 1.4915660206554445e-06, "loss": 0.9904, "step": 21351 }, { "epoch": 0.64, "learning_rate": 1.4913428299818055e-06, "loss": 1.0706, "step": 21352 }, { "epoch": 0.64, "learning_rate": 1.491119648910097e-06, "loss": 1.0936, "step": 21353 }, { "epoch": 0.64, "learning_rate": 1.490896477442445e-06, "loss": 1.1257, "step": 21354 }, { "epoch": 0.64, "learning_rate": 1.490673315580971e-06, "loss": 1.1486, "step": 21355 }, { "epoch": 0.64, "learning_rate": 1.4904501633278012e-06, "loss": 1.0543, "step": 21356 }, { "epoch": 0.64, "learning_rate": 1.49022702068506e-06, "loss": 1.0978, "step": 21357 }, { "epoch": 0.64, "learning_rate": 1.4900038876548705e-06, "loss": 1.1072, "step": 21358 }, { "epoch": 0.64, "learning_rate": 1.4897807642393586e-06, "loss": 1.1077, "step": 21359 }, { "epoch": 0.64, "learning_rate": 1.4895576504406467e-06, "loss": 1.157, "step": 21360 }, { "epoch": 0.64, "learning_rate": 1.489334546260859e-06, "loss": 1.1368, "step": 21361 }, { "epoch": 0.64, "learning_rate": 1.4891114517021204e-06, "loss": 1.0826, "step": 21362 }, { "epoch": 0.64, "learning_rate": 1.488888366766554e-06, "loss": 1.0284, "step": 21363 }, { "epoch": 0.64, "learning_rate": 1.4886652914562827e-06, "loss": 1.0977, "step": 21364 }, { "epoch": 0.64, "learning_rate": 1.488442225773431e-06, "loss": 1.0344, "step": 21365 }, { "epoch": 0.64, "learning_rate": 1.488219169720122e-06, "loss": 1.114, "step": 21366 }, { "epoch": 0.64, "learning_rate": 1.4879961232984802e-06, "loss": 1.0761, "step": 21367 }, { "epoch": 0.64, "learning_rate": 1.4877730865106268e-06, "loss": 1.1209, "step": 21368 }, { "epoch": 0.64, "learning_rate": 1.4875500593586862e-06, "loss": 1.1647, "step": 21369 }, { "epoch": 0.64, "learning_rate": 1.4873270418447816e-06, "loss": 1.0681, "step": 21370 }, { "epoch": 0.64, "learning_rate": 1.4871040339710359e-06, "loss": 0.9935, "step": 21371 }, { "epoch": 0.64, "learning_rate": 1.4868810357395718e-06, "loss": 1.1297, "step": 21372 }, { "epoch": 0.64, "learning_rate": 1.4866580471525128e-06, "loss": 0.9979, "step": 21373 }, { "epoch": 0.64, "learning_rate": 1.4864350682119808e-06, "loss": 1.1487, "step": 21374 }, { "epoch": 0.64, "learning_rate": 1.4862120989200983e-06, "loss": 1.1191, "step": 21375 }, { "epoch": 0.64, "learning_rate": 1.4859891392789893e-06, "loss": 1.2183, "step": 21376 }, { "epoch": 0.64, "learning_rate": 1.4857661892907749e-06, "loss": 1.115, "step": 21377 }, { "epoch": 0.64, "learning_rate": 1.4855432489575777e-06, "loss": 1.1096, "step": 21378 }, { "epoch": 0.64, "learning_rate": 1.48532031828152e-06, "loss": 1.1132, "step": 21379 }, { "epoch": 0.64, "learning_rate": 1.4850973972647253e-06, "loss": 1.1098, "step": 21380 }, { "epoch": 0.64, "learning_rate": 1.4848744859093138e-06, "loss": 1.1718, "step": 21381 }, { "epoch": 0.64, "learning_rate": 1.484651584217408e-06, "loss": 1.1835, "step": 21382 }, { "epoch": 0.64, "learning_rate": 1.4844286921911305e-06, "loss": 1.1038, "step": 21383 }, { "epoch": 0.64, "learning_rate": 1.4842058098326024e-06, "loss": 1.0993, "step": 21384 }, { "epoch": 0.64, "learning_rate": 1.4839829371439468e-06, "loss": 1.0686, "step": 21385 }, { "epoch": 0.64, "learning_rate": 1.4837600741272833e-06, "loss": 1.1786, "step": 21386 }, { "epoch": 0.64, "learning_rate": 1.4835372207847345e-06, "loss": 1.1177, "step": 21387 }, { "epoch": 0.64, "learning_rate": 1.483314377118422e-06, "loss": 1.0613, "step": 21388 }, { "epoch": 0.64, "learning_rate": 1.4830915431304672e-06, "loss": 1.1493, "step": 21389 }, { "epoch": 0.64, "learning_rate": 1.4828687188229906e-06, "loss": 1.0127, "step": 21390 }, { "epoch": 0.64, "learning_rate": 1.4826459041981145e-06, "loss": 1.1812, "step": 21391 }, { "epoch": 0.64, "learning_rate": 1.4824230992579588e-06, "loss": 1.1669, "step": 21392 }, { "epoch": 0.64, "learning_rate": 1.4822003040046462e-06, "loss": 1.1923, "step": 21393 }, { "epoch": 0.64, "learning_rate": 1.4819775184402957e-06, "loss": 1.0456, "step": 21394 }, { "epoch": 0.64, "learning_rate": 1.481754742567029e-06, "loss": 1.2462, "step": 21395 }, { "epoch": 0.64, "learning_rate": 1.4815319763869664e-06, "loss": 1.082, "step": 21396 }, { "epoch": 0.64, "learning_rate": 1.4813092199022294e-06, "loss": 1.0818, "step": 21397 }, { "epoch": 0.64, "learning_rate": 1.4810864731149386e-06, "loss": 1.2225, "step": 21398 }, { "epoch": 0.64, "learning_rate": 1.4808637360272129e-06, "loss": 1.1054, "step": 21399 }, { "epoch": 0.64, "learning_rate": 1.4806410086411738e-06, "loss": 1.2247, "step": 21400 }, { "epoch": 0.64, "learning_rate": 1.480418290958941e-06, "loss": 1.1304, "step": 21401 }, { "epoch": 0.64, "learning_rate": 1.4801955829826358e-06, "loss": 1.1899, "step": 21402 }, { "epoch": 0.64, "learning_rate": 1.479972884714377e-06, "loss": 1.0921, "step": 21403 }, { "epoch": 0.64, "learning_rate": 1.479750196156285e-06, "loss": 1.0861, "step": 21404 }, { "epoch": 0.64, "learning_rate": 1.4795275173104795e-06, "loss": 1.2115, "step": 21405 }, { "epoch": 0.64, "learning_rate": 1.479304848179082e-06, "loss": 1.2563, "step": 21406 }, { "epoch": 0.64, "learning_rate": 1.4790821887642096e-06, "loss": 1.0446, "step": 21407 }, { "epoch": 0.64, "learning_rate": 1.478859539067983e-06, "loss": 1.1635, "step": 21408 }, { "epoch": 0.64, "learning_rate": 1.4786368990925219e-06, "loss": 1.0587, "step": 21409 }, { "epoch": 0.64, "learning_rate": 1.4784142688399456e-06, "loss": 1.0146, "step": 21410 }, { "epoch": 0.65, "learning_rate": 1.4781916483123742e-06, "loss": 1.1034, "step": 21411 }, { "epoch": 0.65, "learning_rate": 1.4779690375119254e-06, "loss": 1.2753, "step": 21412 }, { "epoch": 0.65, "learning_rate": 1.4777464364407192e-06, "loss": 1.0294, "step": 21413 }, { "epoch": 0.65, "learning_rate": 1.4775238451008745e-06, "loss": 1.0788, "step": 21414 }, { "epoch": 0.65, "learning_rate": 1.477301263494511e-06, "loss": 1.222, "step": 21415 }, { "epoch": 0.65, "learning_rate": 1.4770786916237463e-06, "loss": 1.1208, "step": 21416 }, { "epoch": 0.65, "learning_rate": 1.4768561294906997e-06, "loss": 1.2162, "step": 21417 }, { "epoch": 0.65, "learning_rate": 1.4766335770974902e-06, "loss": 1.1058, "step": 21418 }, { "epoch": 0.65, "learning_rate": 1.4764110344462368e-06, "loss": 1.2372, "step": 21419 }, { "epoch": 0.65, "learning_rate": 1.4761885015390571e-06, "loss": 1.09, "step": 21420 }, { "epoch": 0.65, "learning_rate": 1.4759659783780689e-06, "loss": 1.0753, "step": 21421 }, { "epoch": 0.65, "learning_rate": 1.4757434649653918e-06, "loss": 1.0963, "step": 21422 }, { "epoch": 0.65, "learning_rate": 1.4755209613031438e-06, "loss": 1.0663, "step": 21423 }, { "epoch": 0.65, "learning_rate": 1.4752984673934438e-06, "loss": 1.1446, "step": 21424 }, { "epoch": 0.65, "learning_rate": 1.4750759832384077e-06, "loss": 1.0482, "step": 21425 }, { "epoch": 0.65, "learning_rate": 1.4748535088401544e-06, "loss": 1.0969, "step": 21426 }, { "epoch": 0.65, "learning_rate": 1.474631044200802e-06, "loss": 1.0958, "step": 21427 }, { "epoch": 0.65, "learning_rate": 1.4744085893224694e-06, "loss": 1.0448, "step": 21428 }, { "epoch": 0.65, "learning_rate": 1.4741861442072719e-06, "loss": 1.2139, "step": 21429 }, { "epoch": 0.65, "learning_rate": 1.4739637088573287e-06, "loss": 1.2521, "step": 21430 }, { "epoch": 0.65, "learning_rate": 1.4737412832747566e-06, "loss": 1.1701, "step": 21431 }, { "epoch": 0.65, "learning_rate": 1.4735188674616741e-06, "loss": 1.1063, "step": 21432 }, { "epoch": 0.65, "learning_rate": 1.4732964614201969e-06, "loss": 1.1387, "step": 21433 }, { "epoch": 0.65, "learning_rate": 1.4730740651524428e-06, "loss": 1.0665, "step": 21434 }, { "epoch": 0.65, "learning_rate": 1.472851678660529e-06, "loss": 0.9996, "step": 21435 }, { "epoch": 0.65, "learning_rate": 1.4726293019465726e-06, "loss": 1.1509, "step": 21436 }, { "epoch": 0.65, "learning_rate": 1.4724069350126912e-06, "loss": 1.3235, "step": 21437 }, { "epoch": 0.65, "learning_rate": 1.472184577861e-06, "loss": 1.2469, "step": 21438 }, { "epoch": 0.65, "learning_rate": 1.4719622304936168e-06, "loss": 1.0642, "step": 21439 }, { "epoch": 0.65, "learning_rate": 1.471739892912658e-06, "loss": 1.1248, "step": 21440 }, { "epoch": 0.65, "learning_rate": 1.4715175651202404e-06, "loss": 1.1527, "step": 21441 }, { "epoch": 0.65, "learning_rate": 1.47129524711848e-06, "loss": 1.0427, "step": 21442 }, { "epoch": 0.65, "learning_rate": 1.4710729389094932e-06, "loss": 1.1852, "step": 21443 }, { "epoch": 0.65, "learning_rate": 1.4708506404953968e-06, "loss": 1.1135, "step": 21444 }, { "epoch": 0.65, "learning_rate": 1.4706283518783073e-06, "loss": 1.1337, "step": 21445 }, { "epoch": 0.65, "learning_rate": 1.4704060730603393e-06, "loss": 1.123, "step": 21446 }, { "epoch": 0.65, "learning_rate": 1.4701838040436095e-06, "loss": 1.1781, "step": 21447 }, { "epoch": 0.65, "learning_rate": 1.469961544830234e-06, "loss": 1.2107, "step": 21448 }, { "epoch": 0.65, "learning_rate": 1.469739295422329e-06, "loss": 1.0204, "step": 21449 }, { "epoch": 0.65, "learning_rate": 1.4695170558220101e-06, "loss": 1.1013, "step": 21450 }, { "epoch": 0.65, "learning_rate": 1.4692948260313916e-06, "loss": 1.1091, "step": 21451 }, { "epoch": 0.65, "learning_rate": 1.4690726060525901e-06, "loss": 1.1129, "step": 21452 }, { "epoch": 0.65, "learning_rate": 1.4688503958877206e-06, "loss": 1.1083, "step": 21453 }, { "epoch": 0.65, "learning_rate": 1.4686281955388992e-06, "loss": 1.0267, "step": 21454 }, { "epoch": 0.65, "learning_rate": 1.4684060050082404e-06, "loss": 1.0926, "step": 21455 }, { "epoch": 0.65, "learning_rate": 1.4681838242978602e-06, "loss": 1.106, "step": 21456 }, { "epoch": 0.65, "learning_rate": 1.4679616534098723e-06, "loss": 1.1421, "step": 21457 }, { "epoch": 0.65, "learning_rate": 1.4677394923463933e-06, "loss": 1.1133, "step": 21458 }, { "epoch": 0.65, "learning_rate": 1.4675173411095362e-06, "loss": 1.0513, "step": 21459 }, { "epoch": 0.65, "learning_rate": 1.467295199701417e-06, "loss": 1.0532, "step": 21460 }, { "epoch": 0.65, "learning_rate": 1.46707306812415e-06, "loss": 1.1122, "step": 21461 }, { "epoch": 0.65, "learning_rate": 1.4668509463798503e-06, "loss": 1.007, "step": 21462 }, { "epoch": 0.65, "learning_rate": 1.4666288344706325e-06, "loss": 1.2643, "step": 21463 }, { "epoch": 0.65, "learning_rate": 1.4664067323986098e-06, "loss": 1.1678, "step": 21464 }, { "epoch": 0.65, "learning_rate": 1.4661846401658971e-06, "loss": 1.192, "step": 21465 }, { "epoch": 0.65, "learning_rate": 1.465962557774609e-06, "loss": 1.0474, "step": 21466 }, { "epoch": 0.65, "learning_rate": 1.4657404852268598e-06, "loss": 1.1129, "step": 21467 }, { "epoch": 0.65, "learning_rate": 1.4655184225247626e-06, "loss": 1.1525, "step": 21468 }, { "epoch": 0.65, "learning_rate": 1.4652963696704315e-06, "loss": 1.0814, "step": 21469 }, { "epoch": 0.65, "learning_rate": 1.4650743266659805e-06, "loss": 1.087, "step": 21470 }, { "epoch": 0.65, "learning_rate": 1.4648522935135243e-06, "loss": 1.0626, "step": 21471 }, { "epoch": 0.65, "learning_rate": 1.464630270215175e-06, "loss": 1.1314, "step": 21472 }, { "epoch": 0.65, "learning_rate": 1.464408256773047e-06, "loss": 1.0504, "step": 21473 }, { "epoch": 0.65, "learning_rate": 1.4641862531892537e-06, "loss": 1.1072, "step": 21474 }, { "epoch": 0.65, "learning_rate": 1.463964259465908e-06, "loss": 1.0901, "step": 21475 }, { "epoch": 0.65, "learning_rate": 1.463742275605125e-06, "loss": 1.0791, "step": 21476 }, { "epoch": 0.65, "learning_rate": 1.4635203016090155e-06, "loss": 0.9982, "step": 21477 }, { "epoch": 0.65, "learning_rate": 1.4632983374796932e-06, "loss": 0.9771, "step": 21478 }, { "epoch": 0.65, "learning_rate": 1.4630763832192718e-06, "loss": 1.1057, "step": 21479 }, { "epoch": 0.65, "learning_rate": 1.4628544388298643e-06, "loss": 1.1419, "step": 21480 }, { "epoch": 0.65, "learning_rate": 1.4626325043135825e-06, "loss": 1.1848, "step": 21481 }, { "epoch": 0.65, "learning_rate": 1.4624105796725396e-06, "loss": 1.058, "step": 21482 }, { "epoch": 0.65, "learning_rate": 1.4621886649088483e-06, "loss": 1.079, "step": 21483 }, { "epoch": 0.65, "learning_rate": 1.4619667600246212e-06, "loss": 0.9909, "step": 21484 }, { "epoch": 0.65, "learning_rate": 1.4617448650219707e-06, "loss": 1.0281, "step": 21485 }, { "epoch": 0.65, "learning_rate": 1.4615229799030084e-06, "loss": 1.126, "step": 21486 }, { "epoch": 0.65, "learning_rate": 1.4613011046698477e-06, "loss": 1.1345, "step": 21487 }, { "epoch": 0.65, "learning_rate": 1.4610792393245998e-06, "loss": 1.1058, "step": 21488 }, { "epoch": 0.65, "learning_rate": 1.4608573838693785e-06, "loss": 1.075, "step": 21489 }, { "epoch": 0.65, "learning_rate": 1.4606355383062937e-06, "loss": 1.1663, "step": 21490 }, { "epoch": 0.65, "learning_rate": 1.4604137026374577e-06, "loss": 1.1411, "step": 21491 }, { "epoch": 0.65, "learning_rate": 1.4601918768649822e-06, "loss": 1.2051, "step": 21492 }, { "epoch": 0.65, "learning_rate": 1.4599700609909805e-06, "loss": 1.3143, "step": 21493 }, { "epoch": 0.65, "learning_rate": 1.4597482550175624e-06, "loss": 1.1724, "step": 21494 }, { "epoch": 0.65, "learning_rate": 1.4595264589468388e-06, "loss": 1.0911, "step": 21495 }, { "epoch": 0.65, "learning_rate": 1.4593046727809228e-06, "loss": 1.012, "step": 21496 }, { "epoch": 0.65, "learning_rate": 1.4590828965219262e-06, "loss": 1.0066, "step": 21497 }, { "epoch": 0.65, "learning_rate": 1.458861130171958e-06, "loss": 1.0403, "step": 21498 }, { "epoch": 0.65, "learning_rate": 1.4586393737331306e-06, "loss": 1.1226, "step": 21499 }, { "epoch": 0.65, "learning_rate": 1.4584176272075548e-06, "loss": 1.0718, "step": 21500 }, { "epoch": 0.65, "learning_rate": 1.4581958905973414e-06, "loss": 1.1051, "step": 21501 }, { "epoch": 0.65, "learning_rate": 1.4579741639046024e-06, "loss": 1.1608, "step": 21502 }, { "epoch": 0.65, "learning_rate": 1.4577524471314468e-06, "loss": 1.1067, "step": 21503 }, { "epoch": 0.65, "learning_rate": 1.4575307402799854e-06, "loss": 1.1649, "step": 21504 }, { "epoch": 0.65, "learning_rate": 1.4573090433523298e-06, "loss": 1.1926, "step": 21505 }, { "epoch": 0.65, "learning_rate": 1.4570873563505908e-06, "loss": 1.1713, "step": 21506 }, { "epoch": 0.65, "learning_rate": 1.4568656792768767e-06, "loss": 1.0722, "step": 21507 }, { "epoch": 0.65, "learning_rate": 1.4566440121332992e-06, "loss": 1.1777, "step": 21508 }, { "epoch": 0.65, "learning_rate": 1.456422354921968e-06, "loss": 1.134, "step": 21509 }, { "epoch": 0.65, "learning_rate": 1.4562007076449945e-06, "loss": 1.0397, "step": 21510 }, { "epoch": 0.65, "learning_rate": 1.4559790703044863e-06, "loss": 1.0125, "step": 21511 }, { "epoch": 0.65, "learning_rate": 1.4557574429025548e-06, "loss": 1.1487, "step": 21512 }, { "epoch": 0.65, "learning_rate": 1.4555358254413094e-06, "loss": 1.0579, "step": 21513 }, { "epoch": 0.65, "learning_rate": 1.4553142179228607e-06, "loss": 0.9883, "step": 21514 }, { "epoch": 0.65, "learning_rate": 1.455092620349317e-06, "loss": 1.0524, "step": 21515 }, { "epoch": 0.65, "learning_rate": 1.454871032722788e-06, "loss": 1.1819, "step": 21516 }, { "epoch": 0.65, "learning_rate": 1.4546494550453835e-06, "loss": 1.0917, "step": 21517 }, { "epoch": 0.65, "learning_rate": 1.4544278873192125e-06, "loss": 1.2809, "step": 21518 }, { "epoch": 0.65, "learning_rate": 1.454206329546385e-06, "loss": 1.2023, "step": 21519 }, { "epoch": 0.65, "learning_rate": 1.453984781729009e-06, "loss": 1.0003, "step": 21520 }, { "epoch": 0.65, "learning_rate": 1.4537632438691946e-06, "loss": 1.0832, "step": 21521 }, { "epoch": 0.65, "learning_rate": 1.4535417159690495e-06, "loss": 1.1504, "step": 21522 }, { "epoch": 0.65, "learning_rate": 1.453320198030685e-06, "loss": 1.1166, "step": 21523 }, { "epoch": 0.65, "learning_rate": 1.4530986900562066e-06, "loss": 1.1452, "step": 21524 }, { "epoch": 0.65, "learning_rate": 1.4528771920477248e-06, "loss": 1.1278, "step": 21525 }, { "epoch": 0.65, "learning_rate": 1.4526557040073477e-06, "loss": 1.0999, "step": 21526 }, { "epoch": 0.65, "learning_rate": 1.4524342259371848e-06, "loss": 1.0555, "step": 21527 }, { "epoch": 0.65, "learning_rate": 1.452212757839343e-06, "loss": 1.1238, "step": 21528 }, { "epoch": 0.65, "learning_rate": 1.4519912997159308e-06, "loss": 1.0112, "step": 21529 }, { "epoch": 0.65, "learning_rate": 1.4517698515690565e-06, "loss": 1.1058, "step": 21530 }, { "epoch": 0.65, "learning_rate": 1.4515484134008284e-06, "loss": 1.2465, "step": 21531 }, { "epoch": 0.65, "learning_rate": 1.4513269852133557e-06, "loss": 1.2156, "step": 21532 }, { "epoch": 0.65, "learning_rate": 1.4511055670087436e-06, "loss": 1.1824, "step": 21533 }, { "epoch": 0.65, "learning_rate": 1.4508841587891021e-06, "loss": 1.0904, "step": 21534 }, { "epoch": 0.65, "learning_rate": 1.4506627605565377e-06, "loss": 1.1708, "step": 21535 }, { "epoch": 0.65, "learning_rate": 1.4504413723131594e-06, "loss": 1.059, "step": 21536 }, { "epoch": 0.65, "learning_rate": 1.4502199940610728e-06, "loss": 1.1003, "step": 21537 }, { "epoch": 0.65, "learning_rate": 1.4499986258023863e-06, "loss": 1.059, "step": 21538 }, { "epoch": 0.65, "learning_rate": 1.4497772675392069e-06, "loss": 1.1541, "step": 21539 }, { "epoch": 0.65, "learning_rate": 1.4495559192736437e-06, "loss": 1.1422, "step": 21540 }, { "epoch": 0.65, "learning_rate": 1.4493345810078008e-06, "loss": 1.1444, "step": 21541 }, { "epoch": 0.65, "learning_rate": 1.4491132527437864e-06, "loss": 1.0177, "step": 21542 }, { "epoch": 0.65, "learning_rate": 1.4488919344837083e-06, "loss": 1.054, "step": 21543 }, { "epoch": 0.65, "learning_rate": 1.4486706262296723e-06, "loss": 1.1775, "step": 21544 }, { "epoch": 0.65, "learning_rate": 1.4484493279837859e-06, "loss": 1.1412, "step": 21545 }, { "epoch": 0.65, "learning_rate": 1.4482280397481551e-06, "loss": 1.0535, "step": 21546 }, { "epoch": 0.65, "learning_rate": 1.4480067615248873e-06, "loss": 1.2416, "step": 21547 }, { "epoch": 0.65, "learning_rate": 1.4477854933160885e-06, "loss": 1.1082, "step": 21548 }, { "epoch": 0.65, "learning_rate": 1.4475642351238655e-06, "loss": 1.1809, "step": 21549 }, { "epoch": 0.65, "learning_rate": 1.4473429869503235e-06, "loss": 1.0695, "step": 21550 }, { "epoch": 0.65, "learning_rate": 1.4471217487975692e-06, "loss": 1.008, "step": 21551 }, { "epoch": 0.65, "learning_rate": 1.446900520667709e-06, "loss": 1.1248, "step": 21552 }, { "epoch": 0.65, "learning_rate": 1.4466793025628489e-06, "loss": 1.1219, "step": 21553 }, { "epoch": 0.65, "learning_rate": 1.4464580944850941e-06, "loss": 1.1802, "step": 21554 }, { "epoch": 0.65, "learning_rate": 1.4462368964365509e-06, "loss": 1.2363, "step": 21555 }, { "epoch": 0.65, "learning_rate": 1.446015708419325e-06, "loss": 1.0302, "step": 21556 }, { "epoch": 0.65, "learning_rate": 1.4457945304355217e-06, "loss": 1.2061, "step": 21557 }, { "epoch": 0.65, "learning_rate": 1.4455733624872478e-06, "loss": 1.0563, "step": 21558 }, { "epoch": 0.65, "learning_rate": 1.4453522045766067e-06, "loss": 1.09, "step": 21559 }, { "epoch": 0.65, "learning_rate": 1.4451310567057048e-06, "loss": 1.0843, "step": 21560 }, { "epoch": 0.65, "learning_rate": 1.4449099188766468e-06, "loss": 1.1281, "step": 21561 }, { "epoch": 0.65, "learning_rate": 1.4446887910915397e-06, "loss": 1.1383, "step": 21562 }, { "epoch": 0.65, "learning_rate": 1.4444676733524856e-06, "loss": 1.0894, "step": 21563 }, { "epoch": 0.65, "learning_rate": 1.444246565661591e-06, "loss": 1.1583, "step": 21564 }, { "epoch": 0.65, "learning_rate": 1.4440254680209608e-06, "loss": 1.1042, "step": 21565 }, { "epoch": 0.65, "learning_rate": 1.4438043804327007e-06, "loss": 1.0043, "step": 21566 }, { "epoch": 0.65, "learning_rate": 1.443583302898913e-06, "loss": 1.1014, "step": 21567 }, { "epoch": 0.65, "learning_rate": 1.4433622354217035e-06, "loss": 1.0665, "step": 21568 }, { "epoch": 0.65, "learning_rate": 1.4431411780031765e-06, "loss": 1.0561, "step": 21569 }, { "epoch": 0.65, "learning_rate": 1.4429201306454365e-06, "loss": 1.1228, "step": 21570 }, { "epoch": 0.65, "learning_rate": 1.442699093350588e-06, "loss": 1.0413, "step": 21571 }, { "epoch": 0.65, "learning_rate": 1.442478066120735e-06, "loss": 1.1321, "step": 21572 }, { "epoch": 0.65, "learning_rate": 1.4422570489579813e-06, "loss": 1.1136, "step": 21573 }, { "epoch": 0.65, "learning_rate": 1.442036041864432e-06, "loss": 1.1264, "step": 21574 }, { "epoch": 0.65, "learning_rate": 1.4418150448421888e-06, "loss": 1.1796, "step": 21575 }, { "epoch": 0.65, "learning_rate": 1.441594057893357e-06, "loss": 1.0645, "step": 21576 }, { "epoch": 0.65, "learning_rate": 1.44137308102004e-06, "loss": 1.0026, "step": 21577 }, { "epoch": 0.65, "learning_rate": 1.4411521142243415e-06, "loss": 1.0634, "step": 21578 }, { "epoch": 0.65, "learning_rate": 1.440931157508366e-06, "loss": 1.0205, "step": 21579 }, { "epoch": 0.65, "learning_rate": 1.4407102108742147e-06, "loss": 1.1944, "step": 21580 }, { "epoch": 0.65, "learning_rate": 1.4404892743239919e-06, "loss": 1.0682, "step": 21581 }, { "epoch": 0.65, "learning_rate": 1.4402683478598012e-06, "loss": 1.0659, "step": 21582 }, { "epoch": 0.65, "learning_rate": 1.4400474314837452e-06, "loss": 1.1257, "step": 21583 }, { "epoch": 0.65, "learning_rate": 1.4398265251979282e-06, "loss": 1.0432, "step": 21584 }, { "epoch": 0.65, "learning_rate": 1.439605629004451e-06, "loss": 1.1778, "step": 21585 }, { "epoch": 0.65, "learning_rate": 1.4393847429054175e-06, "loss": 1.1898, "step": 21586 }, { "epoch": 0.65, "learning_rate": 1.4391638669029307e-06, "loss": 1.0408, "step": 21587 }, { "epoch": 0.65, "learning_rate": 1.438943000999094e-06, "loss": 1.1777, "step": 21588 }, { "epoch": 0.65, "learning_rate": 1.4387221451960077e-06, "loss": 1.114, "step": 21589 }, { "epoch": 0.65, "learning_rate": 1.4385012994957754e-06, "loss": 1.106, "step": 21590 }, { "epoch": 0.65, "learning_rate": 1.4382804639004996e-06, "loss": 1.1978, "step": 21591 }, { "epoch": 0.65, "learning_rate": 1.4380596384122835e-06, "loss": 1.1941, "step": 21592 }, { "epoch": 0.65, "learning_rate": 1.437838823033227e-06, "loss": 1.2332, "step": 21593 }, { "epoch": 0.65, "learning_rate": 1.4376180177654336e-06, "loss": 1.2145, "step": 21594 }, { "epoch": 0.65, "learning_rate": 1.437397222611005e-06, "loss": 1.1288, "step": 21595 }, { "epoch": 0.65, "learning_rate": 1.4371764375720426e-06, "loss": 1.074, "step": 21596 }, { "epoch": 0.65, "learning_rate": 1.4369556626506503e-06, "loss": 1.0961, "step": 21597 }, { "epoch": 0.65, "learning_rate": 1.4367348978489265e-06, "loss": 1.0902, "step": 21598 }, { "epoch": 0.65, "learning_rate": 1.436514143168975e-06, "loss": 1.169, "step": 21599 }, { "epoch": 0.65, "learning_rate": 1.4362933986128962e-06, "loss": 1.2319, "step": 21600 }, { "epoch": 0.65, "learning_rate": 1.436072664182792e-06, "loss": 1.1069, "step": 21601 }, { "epoch": 0.65, "learning_rate": 1.4358519398807638e-06, "loss": 1.0562, "step": 21602 }, { "epoch": 0.65, "learning_rate": 1.4356312257089127e-06, "loss": 1.186, "step": 21603 }, { "epoch": 0.65, "learning_rate": 1.4354105216693396e-06, "loss": 0.959, "step": 21604 }, { "epoch": 0.65, "learning_rate": 1.4351898277641466e-06, "loss": 1.1465, "step": 21605 }, { "epoch": 0.65, "learning_rate": 1.4349691439954325e-06, "loss": 1.1479, "step": 21606 }, { "epoch": 0.65, "learning_rate": 1.4347484703652991e-06, "loss": 1.0832, "step": 21607 }, { "epoch": 0.65, "learning_rate": 1.4345278068758478e-06, "loss": 1.1216, "step": 21608 }, { "epoch": 0.65, "learning_rate": 1.434307153529178e-06, "loss": 0.9929, "step": 21609 }, { "epoch": 0.65, "learning_rate": 1.4340865103273921e-06, "loss": 1.1166, "step": 21610 }, { "epoch": 0.65, "learning_rate": 1.4338658772725883e-06, "loss": 1.0844, "step": 21611 }, { "epoch": 0.65, "learning_rate": 1.4336452543668677e-06, "loss": 1.188, "step": 21612 }, { "epoch": 0.65, "learning_rate": 1.433424641612331e-06, "loss": 1.069, "step": 21613 }, { "epoch": 0.65, "learning_rate": 1.433204039011079e-06, "loss": 1.1224, "step": 21614 }, { "epoch": 0.65, "learning_rate": 1.4329834465652096e-06, "loss": 1.0854, "step": 21615 }, { "epoch": 0.65, "learning_rate": 1.4327628642768237e-06, "loss": 1.0977, "step": 21616 }, { "epoch": 0.65, "learning_rate": 1.4325422921480217e-06, "loss": 1.1626, "step": 21617 }, { "epoch": 0.65, "learning_rate": 1.4323217301809039e-06, "loss": 1.123, "step": 21618 }, { "epoch": 0.65, "learning_rate": 1.432101178377568e-06, "loss": 1.1139, "step": 21619 }, { "epoch": 0.65, "learning_rate": 1.4318806367401144e-06, "loss": 1.101, "step": 21620 }, { "epoch": 0.65, "learning_rate": 1.4316601052706431e-06, "loss": 1.2014, "step": 21621 }, { "epoch": 0.65, "learning_rate": 1.4314395839712525e-06, "loss": 1.1299, "step": 21622 }, { "epoch": 0.65, "learning_rate": 1.4312190728440439e-06, "loss": 1.1006, "step": 21623 }, { "epoch": 0.65, "learning_rate": 1.4309985718911138e-06, "loss": 1.1106, "step": 21624 }, { "epoch": 0.65, "learning_rate": 1.4307780811145624e-06, "loss": 1.0977, "step": 21625 }, { "epoch": 0.65, "learning_rate": 1.430557600516489e-06, "loss": 1.1127, "step": 21626 }, { "epoch": 0.65, "learning_rate": 1.4303371300989916e-06, "loss": 1.0963, "step": 21627 }, { "epoch": 0.65, "learning_rate": 1.43011666986417e-06, "loss": 1.0229, "step": 21628 }, { "epoch": 0.65, "learning_rate": 1.4298962198141225e-06, "loss": 1.0469, "step": 21629 }, { "epoch": 0.65, "learning_rate": 1.4296757799509473e-06, "loss": 1.0391, "step": 21630 }, { "epoch": 0.65, "learning_rate": 1.4294553502767444e-06, "loss": 1.292, "step": 21631 }, { "epoch": 0.65, "learning_rate": 1.4292349307936098e-06, "loss": 1.0104, "step": 21632 }, { "epoch": 0.65, "learning_rate": 1.4290145215036433e-06, "loss": 1.2483, "step": 21633 }, { "epoch": 0.65, "learning_rate": 1.4287941224089425e-06, "loss": 1.0263, "step": 21634 }, { "epoch": 0.65, "learning_rate": 1.4285737335116057e-06, "loss": 1.0942, "step": 21635 }, { "epoch": 0.65, "learning_rate": 1.4283533548137318e-06, "loss": 1.2088, "step": 21636 }, { "epoch": 0.65, "learning_rate": 1.428132986317417e-06, "loss": 1.1345, "step": 21637 }, { "epoch": 0.65, "learning_rate": 1.4279126280247602e-06, "loss": 1.1345, "step": 21638 }, { "epoch": 0.65, "learning_rate": 1.4276922799378583e-06, "loss": 1.0701, "step": 21639 }, { "epoch": 0.65, "learning_rate": 1.4274719420588112e-06, "loss": 1.0123, "step": 21640 }, { "epoch": 0.65, "learning_rate": 1.427251614389713e-06, "loss": 1.1551, "step": 21641 }, { "epoch": 0.65, "learning_rate": 1.4270312969326632e-06, "loss": 1.1625, "step": 21642 }, { "epoch": 0.65, "learning_rate": 1.4268109896897586e-06, "loss": 1.1811, "step": 21643 }, { "epoch": 0.65, "learning_rate": 1.4265906926630973e-06, "loss": 0.9387, "step": 21644 }, { "epoch": 0.65, "learning_rate": 1.4263704058547747e-06, "loss": 1.1927, "step": 21645 }, { "epoch": 0.65, "learning_rate": 1.426150129266889e-06, "loss": 1.1199, "step": 21646 }, { "epoch": 0.65, "learning_rate": 1.4259298629015366e-06, "loss": 1.0677, "step": 21647 }, { "epoch": 0.65, "learning_rate": 1.4257096067608144e-06, "loss": 1.1303, "step": 21648 }, { "epoch": 0.65, "learning_rate": 1.4254893608468209e-06, "loss": 1.0851, "step": 21649 }, { "epoch": 0.65, "learning_rate": 1.4252691251616502e-06, "loss": 1.2503, "step": 21650 }, { "epoch": 0.65, "learning_rate": 1.4250488997073995e-06, "loss": 1.1469, "step": 21651 }, { "epoch": 0.65, "learning_rate": 1.4248286844861655e-06, "loss": 1.0989, "step": 21652 }, { "epoch": 0.65, "learning_rate": 1.4246084795000447e-06, "loss": 1.1353, "step": 21653 }, { "epoch": 0.65, "learning_rate": 1.4243882847511333e-06, "loss": 1.1658, "step": 21654 }, { "epoch": 0.65, "learning_rate": 1.4241681002415276e-06, "loss": 1.2148, "step": 21655 }, { "epoch": 0.65, "learning_rate": 1.423947925973324e-06, "loss": 1.1881, "step": 21656 }, { "epoch": 0.65, "learning_rate": 1.4237277619486172e-06, "loss": 1.0336, "step": 21657 }, { "epoch": 0.65, "learning_rate": 1.4235076081695037e-06, "loss": 1.0765, "step": 21658 }, { "epoch": 0.65, "learning_rate": 1.4232874646380793e-06, "loss": 1.2109, "step": 21659 }, { "epoch": 0.65, "learning_rate": 1.4230673313564397e-06, "loss": 1.0485, "step": 21660 }, { "epoch": 0.65, "learning_rate": 1.4228472083266804e-06, "loss": 1.1961, "step": 21661 }, { "epoch": 0.65, "learning_rate": 1.422627095550898e-06, "loss": 1.1752, "step": 21662 }, { "epoch": 0.65, "learning_rate": 1.4224069930311856e-06, "loss": 1.0839, "step": 21663 }, { "epoch": 0.65, "learning_rate": 1.4221869007696398e-06, "loss": 1.0938, "step": 21664 }, { "epoch": 0.65, "learning_rate": 1.4219668187683555e-06, "loss": 1.1721, "step": 21665 }, { "epoch": 0.65, "learning_rate": 1.4217467470294288e-06, "loss": 1.0353, "step": 21666 }, { "epoch": 0.65, "learning_rate": 1.4215266855549531e-06, "loss": 1.1561, "step": 21667 }, { "epoch": 0.65, "learning_rate": 1.4213066343470237e-06, "loss": 1.0323, "step": 21668 }, { "epoch": 0.65, "learning_rate": 1.4210865934077356e-06, "loss": 1.1326, "step": 21669 }, { "epoch": 0.65, "learning_rate": 1.4208665627391843e-06, "loss": 1.0997, "step": 21670 }, { "epoch": 0.65, "learning_rate": 1.4206465423434628e-06, "loss": 1.14, "step": 21671 }, { "epoch": 0.65, "learning_rate": 1.4204265322226668e-06, "loss": 1.0403, "step": 21672 }, { "epoch": 0.65, "learning_rate": 1.4202065323788899e-06, "loss": 1.1093, "step": 21673 }, { "epoch": 0.65, "learning_rate": 1.4199865428142268e-06, "loss": 1.0549, "step": 21674 }, { "epoch": 0.65, "learning_rate": 1.4197665635307725e-06, "loss": 1.1633, "step": 21675 }, { "epoch": 0.65, "learning_rate": 1.4195465945306195e-06, "loss": 1.0873, "step": 21676 }, { "epoch": 0.65, "learning_rate": 1.4193266358158624e-06, "loss": 1.1512, "step": 21677 }, { "epoch": 0.65, "learning_rate": 1.4191066873885953e-06, "loss": 1.0425, "step": 21678 }, { "epoch": 0.65, "learning_rate": 1.418886749250913e-06, "loss": 1.0723, "step": 21679 }, { "epoch": 0.65, "learning_rate": 1.418666821404907e-06, "loss": 1.042, "step": 21680 }, { "epoch": 0.65, "learning_rate": 1.4184469038526721e-06, "loss": 1.0778, "step": 21681 }, { "epoch": 0.65, "learning_rate": 1.418226996596302e-06, "loss": 1.1999, "step": 21682 }, { "epoch": 0.65, "learning_rate": 1.4180070996378898e-06, "loss": 1.0931, "step": 21683 }, { "epoch": 0.65, "learning_rate": 1.417787212979529e-06, "loss": 1.0596, "step": 21684 }, { "epoch": 0.65, "learning_rate": 1.4175673366233126e-06, "loss": 1.1909, "step": 21685 }, { "epoch": 0.65, "learning_rate": 1.4173474705713337e-06, "loss": 1.1431, "step": 21686 }, { "epoch": 0.65, "learning_rate": 1.4171276148256858e-06, "loss": 1.2314, "step": 21687 }, { "epoch": 0.65, "learning_rate": 1.4169077693884623e-06, "loss": 1.1281, "step": 21688 }, { "epoch": 0.65, "learning_rate": 1.416687934261754e-06, "loss": 1.0938, "step": 21689 }, { "epoch": 0.65, "learning_rate": 1.4164681094476552e-06, "loss": 1.1175, "step": 21690 }, { "epoch": 0.65, "learning_rate": 1.4162482949482578e-06, "loss": 1.1384, "step": 21691 }, { "epoch": 0.65, "learning_rate": 1.4160284907656558e-06, "loss": 1.1204, "step": 21692 }, { "epoch": 0.65, "learning_rate": 1.4158086969019396e-06, "loss": 1.1335, "step": 21693 }, { "epoch": 0.65, "learning_rate": 1.4155889133592025e-06, "loss": 1.0405, "step": 21694 }, { "epoch": 0.65, "learning_rate": 1.4153691401395365e-06, "loss": 1.1115, "step": 21695 }, { "epoch": 0.65, "learning_rate": 1.4151493772450349e-06, "loss": 1.1134, "step": 21696 }, { "epoch": 0.65, "learning_rate": 1.4149296246777878e-06, "loss": 1.0109, "step": 21697 }, { "epoch": 0.65, "learning_rate": 1.414709882439888e-06, "loss": 1.1141, "step": 21698 }, { "epoch": 0.65, "learning_rate": 1.4144901505334277e-06, "loss": 1.1794, "step": 21699 }, { "epoch": 0.65, "learning_rate": 1.4142704289604992e-06, "loss": 1.0446, "step": 21700 }, { "epoch": 0.65, "learning_rate": 1.414050717723192e-06, "loss": 1.0269, "step": 21701 }, { "epoch": 0.65, "learning_rate": 1.4138310168235998e-06, "loss": 1.1506, "step": 21702 }, { "epoch": 0.65, "learning_rate": 1.4136113262638123e-06, "loss": 1.1057, "step": 21703 }, { "epoch": 0.65, "learning_rate": 1.4133916460459224e-06, "loss": 1.1001, "step": 21704 }, { "epoch": 0.65, "learning_rate": 1.4131719761720214e-06, "loss": 1.1041, "step": 21705 }, { "epoch": 0.65, "learning_rate": 1.4129523166441985e-06, "loss": 0.975, "step": 21706 }, { "epoch": 0.65, "learning_rate": 1.4127326674645464e-06, "loss": 1.1731, "step": 21707 }, { "epoch": 0.65, "learning_rate": 1.4125130286351553e-06, "loss": 1.132, "step": 21708 }, { "epoch": 0.65, "learning_rate": 1.4122934001581167e-06, "loss": 1.0244, "step": 21709 }, { "epoch": 0.65, "learning_rate": 1.4120737820355214e-06, "loss": 1.0455, "step": 21710 }, { "epoch": 0.65, "learning_rate": 1.4118541742694592e-06, "loss": 1.0729, "step": 21711 }, { "epoch": 0.65, "learning_rate": 1.4116345768620212e-06, "loss": 1.102, "step": 21712 }, { "epoch": 0.65, "learning_rate": 1.411414989815299e-06, "loss": 1.1255, "step": 21713 }, { "epoch": 0.65, "learning_rate": 1.411195413131381e-06, "loss": 1.0981, "step": 21714 }, { "epoch": 0.65, "learning_rate": 1.410975846812358e-06, "loss": 1.1188, "step": 21715 }, { "epoch": 0.65, "learning_rate": 1.4107562908603205e-06, "loss": 1.0496, "step": 21716 }, { "epoch": 0.65, "learning_rate": 1.4105367452773585e-06, "loss": 1.0768, "step": 21717 }, { "epoch": 0.65, "learning_rate": 1.4103172100655631e-06, "loss": 1.1263, "step": 21718 }, { "epoch": 0.65, "learning_rate": 1.410097685227022e-06, "loss": 1.1199, "step": 21719 }, { "epoch": 0.65, "learning_rate": 1.409878170763826e-06, "loss": 0.9967, "step": 21720 }, { "epoch": 0.65, "learning_rate": 1.409658666678065e-06, "loss": 1.1477, "step": 21721 }, { "epoch": 0.65, "learning_rate": 1.409439172971829e-06, "loss": 0.9984, "step": 21722 }, { "epoch": 0.65, "learning_rate": 1.409219689647206e-06, "loss": 1.0424, "step": 21723 }, { "epoch": 0.65, "learning_rate": 1.409000216706286e-06, "loss": 1.1027, "step": 21724 }, { "epoch": 0.65, "learning_rate": 1.408780754151159e-06, "loss": 1.1155, "step": 21725 }, { "epoch": 0.65, "learning_rate": 1.4085613019839146e-06, "loss": 1.1387, "step": 21726 }, { "epoch": 0.65, "learning_rate": 1.4083418602066396e-06, "loss": 1.1438, "step": 21727 }, { "epoch": 0.65, "learning_rate": 1.4081224288214243e-06, "loss": 1.0605, "step": 21728 }, { "epoch": 0.65, "learning_rate": 1.407903007830358e-06, "loss": 1.103, "step": 21729 }, { "epoch": 0.65, "learning_rate": 1.4076835972355287e-06, "loss": 1.1551, "step": 21730 }, { "epoch": 0.65, "learning_rate": 1.4074641970390267e-06, "loss": 1.233, "step": 21731 }, { "epoch": 0.65, "learning_rate": 1.4072448072429384e-06, "loss": 1.0864, "step": 21732 }, { "epoch": 0.65, "learning_rate": 1.407025427849353e-06, "loss": 1.2108, "step": 21733 }, { "epoch": 0.65, "learning_rate": 1.4068060588603593e-06, "loss": 1.0592, "step": 21734 }, { "epoch": 0.65, "learning_rate": 1.4065867002780454e-06, "loss": 1.088, "step": 21735 }, { "epoch": 0.65, "learning_rate": 1.4063673521044997e-06, "loss": 1.0873, "step": 21736 }, { "epoch": 0.65, "learning_rate": 1.4061480143418098e-06, "loss": 1.1811, "step": 21737 }, { "epoch": 0.65, "learning_rate": 1.4059286869920651e-06, "loss": 1.1024, "step": 21738 }, { "epoch": 0.65, "learning_rate": 1.4057093700573516e-06, "loss": 1.0906, "step": 21739 }, { "epoch": 0.65, "learning_rate": 1.4054900635397573e-06, "loss": 1.1167, "step": 21740 }, { "epoch": 0.65, "learning_rate": 1.405270767441371e-06, "loss": 1.0132, "step": 21741 }, { "epoch": 0.65, "learning_rate": 1.4050514817642797e-06, "loss": 1.0354, "step": 21742 }, { "epoch": 0.66, "learning_rate": 1.4048322065105707e-06, "loss": 1.1839, "step": 21743 }, { "epoch": 0.66, "learning_rate": 1.4046129416823328e-06, "loss": 1.1597, "step": 21744 }, { "epoch": 0.66, "learning_rate": 1.404393687281651e-06, "loss": 1.0992, "step": 21745 }, { "epoch": 0.66, "learning_rate": 1.4041744433106135e-06, "loss": 1.0699, "step": 21746 }, { "epoch": 0.66, "learning_rate": 1.403955209771308e-06, "loss": 1.0188, "step": 21747 }, { "epoch": 0.66, "learning_rate": 1.4037359866658218e-06, "loss": 1.0801, "step": 21748 }, { "epoch": 0.66, "learning_rate": 1.4035167739962403e-06, "loss": 1.0478, "step": 21749 }, { "epoch": 0.66, "learning_rate": 1.4032975717646505e-06, "loss": 1.083, "step": 21750 }, { "epoch": 0.66, "learning_rate": 1.4030783799731398e-06, "loss": 1.0345, "step": 21751 }, { "epoch": 0.66, "learning_rate": 1.4028591986237957e-06, "loss": 1.0389, "step": 21752 }, { "epoch": 0.66, "learning_rate": 1.4026400277187025e-06, "loss": 1.0501, "step": 21753 }, { "epoch": 0.66, "learning_rate": 1.4024208672599482e-06, "loss": 1.1294, "step": 21754 }, { "epoch": 0.66, "learning_rate": 1.4022017172496184e-06, "loss": 1.1081, "step": 21755 }, { "epoch": 0.66, "learning_rate": 1.4019825776897992e-06, "loss": 1.0398, "step": 21756 }, { "epoch": 0.66, "learning_rate": 1.401763448582578e-06, "loss": 1.1158, "step": 21757 }, { "epoch": 0.66, "learning_rate": 1.401544329930039e-06, "loss": 1.0705, "step": 21758 }, { "epoch": 0.66, "learning_rate": 1.4013252217342693e-06, "loss": 1.1187, "step": 21759 }, { "epoch": 0.66, "learning_rate": 1.401106123997354e-06, "loss": 1.0393, "step": 21760 }, { "epoch": 0.66, "learning_rate": 1.4008870367213803e-06, "loss": 1.1559, "step": 21761 }, { "epoch": 0.66, "learning_rate": 1.4006679599084317e-06, "loss": 1.3167, "step": 21762 }, { "epoch": 0.66, "learning_rate": 1.4004488935605948e-06, "loss": 1.2136, "step": 21763 }, { "epoch": 0.66, "learning_rate": 1.4002298376799545e-06, "loss": 1.0706, "step": 21764 }, { "epoch": 0.66, "learning_rate": 1.4000107922685966e-06, "loss": 1.0361, "step": 21765 }, { "epoch": 0.66, "learning_rate": 1.3997917573286062e-06, "loss": 1.0223, "step": 21766 }, { "epoch": 0.66, "learning_rate": 1.3995727328620683e-06, "loss": 1.1372, "step": 21767 }, { "epoch": 0.66, "learning_rate": 1.3993537188710683e-06, "loss": 1.1492, "step": 21768 }, { "epoch": 0.66, "learning_rate": 1.3991347153576907e-06, "loss": 1.1835, "step": 21769 }, { "epoch": 0.66, "learning_rate": 1.398915722324021e-06, "loss": 1.0577, "step": 21770 }, { "epoch": 0.66, "learning_rate": 1.3986967397721427e-06, "loss": 1.067, "step": 21771 }, { "epoch": 0.66, "learning_rate": 1.3984777677041412e-06, "loss": 1.1802, "step": 21772 }, { "epoch": 0.66, "learning_rate": 1.3982588061221003e-06, "loss": 1.2358, "step": 21773 }, { "epoch": 0.66, "learning_rate": 1.3980398550281063e-06, "loss": 1.2695, "step": 21774 }, { "epoch": 0.66, "learning_rate": 1.3978209144242411e-06, "loss": 1.0661, "step": 21775 }, { "epoch": 0.66, "learning_rate": 1.39760198431259e-06, "loss": 1.0901, "step": 21776 }, { "epoch": 0.66, "learning_rate": 1.3973830646952372e-06, "loss": 1.0986, "step": 21777 }, { "epoch": 0.66, "learning_rate": 1.3971641555742674e-06, "loss": 1.0065, "step": 21778 }, { "epoch": 0.66, "learning_rate": 1.3969452569517628e-06, "loss": 1.135, "step": 21779 }, { "epoch": 0.66, "learning_rate": 1.396726368829808e-06, "loss": 1.0864, "step": 21780 }, { "epoch": 0.66, "learning_rate": 1.3965074912104871e-06, "loss": 1.202, "step": 21781 }, { "epoch": 0.66, "learning_rate": 1.3962886240958828e-06, "loss": 1.1113, "step": 21782 }, { "epoch": 0.66, "learning_rate": 1.3960697674880807e-06, "loss": 1.1077, "step": 21783 }, { "epoch": 0.66, "learning_rate": 1.3958509213891619e-06, "loss": 1.0208, "step": 21784 }, { "epoch": 0.66, "learning_rate": 1.3956320858012102e-06, "loss": 1.0229, "step": 21785 }, { "epoch": 0.66, "learning_rate": 1.3954132607263094e-06, "loss": 1.0293, "step": 21786 }, { "epoch": 0.66, "learning_rate": 1.395194446166543e-06, "loss": 1.1232, "step": 21787 }, { "epoch": 0.66, "learning_rate": 1.3949756421239926e-06, "loss": 1.1326, "step": 21788 }, { "epoch": 0.66, "learning_rate": 1.3947568486007422e-06, "loss": 1.1039, "step": 21789 }, { "epoch": 0.66, "learning_rate": 1.3945380655988737e-06, "loss": 1.027, "step": 21790 }, { "epoch": 0.66, "learning_rate": 1.3943192931204707e-06, "loss": 1.0039, "step": 21791 }, { "epoch": 0.66, "learning_rate": 1.3941005311676156e-06, "loss": 1.1446, "step": 21792 }, { "epoch": 0.66, "learning_rate": 1.393881779742391e-06, "loss": 1.1526, "step": 21793 }, { "epoch": 0.66, "learning_rate": 1.3936630388468786e-06, "loss": 1.2187, "step": 21794 }, { "epoch": 0.66, "learning_rate": 1.3934443084831616e-06, "loss": 1.102, "step": 21795 }, { "epoch": 0.66, "learning_rate": 1.393225588653323e-06, "loss": 1.0942, "step": 21796 }, { "epoch": 0.66, "learning_rate": 1.3930068793594426e-06, "loss": 1.0642, "step": 21797 }, { "epoch": 0.66, "learning_rate": 1.392788180603603e-06, "loss": 1.194, "step": 21798 }, { "epoch": 0.66, "learning_rate": 1.3925694923878874e-06, "loss": 1.1423, "step": 21799 }, { "epoch": 0.66, "learning_rate": 1.3923508147143777e-06, "loss": 1.1161, "step": 21800 }, { "epoch": 0.66, "learning_rate": 1.3921321475851537e-06, "loss": 1.178, "step": 21801 }, { "epoch": 0.66, "learning_rate": 1.391913491002298e-06, "loss": 1.2031, "step": 21802 }, { "epoch": 0.66, "learning_rate": 1.3916948449678924e-06, "loss": 1.0262, "step": 21803 }, { "epoch": 0.66, "learning_rate": 1.391476209484019e-06, "loss": 1.0876, "step": 21804 }, { "epoch": 0.66, "learning_rate": 1.391257584552757e-06, "loss": 1.1282, "step": 21805 }, { "epoch": 0.66, "learning_rate": 1.3910389701761892e-06, "loss": 1.1269, "step": 21806 }, { "epoch": 0.66, "learning_rate": 1.3908203663563964e-06, "loss": 0.9637, "step": 21807 }, { "epoch": 0.66, "learning_rate": 1.390601773095459e-06, "loss": 1.1152, "step": 21808 }, { "epoch": 0.66, "learning_rate": 1.3903831903954596e-06, "loss": 1.0226, "step": 21809 }, { "epoch": 0.66, "learning_rate": 1.3901646182584768e-06, "loss": 1.1099, "step": 21810 }, { "epoch": 0.66, "learning_rate": 1.3899460566865924e-06, "loss": 1.1729, "step": 21811 }, { "epoch": 0.66, "learning_rate": 1.389727505681887e-06, "loss": 1.0759, "step": 21812 }, { "epoch": 0.66, "learning_rate": 1.389508965246442e-06, "loss": 1.1277, "step": 21813 }, { "epoch": 0.66, "learning_rate": 1.3892904353823355e-06, "loss": 1.1105, "step": 21814 }, { "epoch": 0.66, "learning_rate": 1.3890719160916493e-06, "loss": 1.1357, "step": 21815 }, { "epoch": 0.66, "learning_rate": 1.3888534073764636e-06, "loss": 1.1102, "step": 21816 }, { "epoch": 0.66, "learning_rate": 1.3886349092388585e-06, "loss": 1.1057, "step": 21817 }, { "epoch": 0.66, "learning_rate": 1.3884164216809131e-06, "loss": 1.1038, "step": 21818 }, { "epoch": 0.66, "learning_rate": 1.3881979447047086e-06, "loss": 1.1747, "step": 21819 }, { "epoch": 0.66, "learning_rate": 1.3879794783123252e-06, "loss": 1.0747, "step": 21820 }, { "epoch": 0.66, "learning_rate": 1.3877610225058402e-06, "loss": 1.1096, "step": 21821 }, { "epoch": 0.66, "learning_rate": 1.387542577287335e-06, "loss": 1.0917, "step": 21822 }, { "epoch": 0.66, "learning_rate": 1.3873241426588885e-06, "loss": 1.0625, "step": 21823 }, { "epoch": 0.66, "learning_rate": 1.38710571862258e-06, "loss": 1.1714, "step": 21824 }, { "epoch": 0.66, "learning_rate": 1.3868873051804896e-06, "loss": 1.1389, "step": 21825 }, { "epoch": 0.66, "learning_rate": 1.3866689023346969e-06, "loss": 1.0391, "step": 21826 }, { "epoch": 0.66, "learning_rate": 1.3864505100872787e-06, "loss": 1.1331, "step": 21827 }, { "epoch": 0.66, "learning_rate": 1.3862321284403155e-06, "loss": 1.1344, "step": 21828 }, { "epoch": 0.66, "learning_rate": 1.386013757395886e-06, "loss": 1.1811, "step": 21829 }, { "epoch": 0.66, "learning_rate": 1.38579539695607e-06, "loss": 1.1822, "step": 21830 }, { "epoch": 0.66, "learning_rate": 1.3855770471229443e-06, "loss": 1.2178, "step": 21831 }, { "epoch": 0.66, "learning_rate": 1.3853587078985884e-06, "loss": 1.1256, "step": 21832 }, { "epoch": 0.66, "learning_rate": 1.3851403792850807e-06, "loss": 0.9529, "step": 21833 }, { "epoch": 0.66, "learning_rate": 1.3849220612844997e-06, "loss": 1.0355, "step": 21834 }, { "epoch": 0.66, "learning_rate": 1.3847037538989243e-06, "loss": 1.0671, "step": 21835 }, { "epoch": 0.66, "learning_rate": 1.3844854571304318e-06, "loss": 1.1085, "step": 21836 }, { "epoch": 0.66, "learning_rate": 1.3842671709810996e-06, "loss": 1.2604, "step": 21837 }, { "epoch": 0.66, "learning_rate": 1.384048895453007e-06, "loss": 1.1066, "step": 21838 }, { "epoch": 0.66, "learning_rate": 1.3838306305482325e-06, "loss": 1.114, "step": 21839 }, { "epoch": 0.66, "learning_rate": 1.3836123762688518e-06, "loss": 1.0682, "step": 21840 }, { "epoch": 0.66, "learning_rate": 1.3833941326169437e-06, "loss": 1.1345, "step": 21841 }, { "epoch": 0.66, "learning_rate": 1.3831758995945854e-06, "loss": 1.1183, "step": 21842 }, { "epoch": 0.66, "learning_rate": 1.382957677203856e-06, "loss": 1.3124, "step": 21843 }, { "epoch": 0.66, "learning_rate": 1.3827394654468302e-06, "loss": 1.1011, "step": 21844 }, { "epoch": 0.66, "learning_rate": 1.382521264325587e-06, "loss": 1.0553, "step": 21845 }, { "epoch": 0.66, "learning_rate": 1.3823030738422026e-06, "loss": 1.0983, "step": 21846 }, { "epoch": 0.66, "learning_rate": 1.3820848939987552e-06, "loss": 1.0962, "step": 21847 }, { "epoch": 0.66, "learning_rate": 1.3818667247973208e-06, "loss": 1.0707, "step": 21848 }, { "epoch": 0.66, "learning_rate": 1.381648566239977e-06, "loss": 1.0587, "step": 21849 }, { "epoch": 0.66, "learning_rate": 1.3814304183288e-06, "loss": 1.0485, "step": 21850 }, { "epoch": 0.66, "learning_rate": 1.3812122810658667e-06, "loss": 1.0209, "step": 21851 }, { "epoch": 0.66, "learning_rate": 1.3809941544532545e-06, "loss": 1.1083, "step": 21852 }, { "epoch": 0.66, "learning_rate": 1.3807760384930385e-06, "loss": 1.1542, "step": 21853 }, { "epoch": 0.66, "learning_rate": 1.3805579331872954e-06, "loss": 1.1218, "step": 21854 }, { "epoch": 0.66, "learning_rate": 1.3803398385381012e-06, "loss": 1.2839, "step": 21855 }, { "epoch": 0.66, "learning_rate": 1.3801217545475338e-06, "loss": 1.0593, "step": 21856 }, { "epoch": 0.66, "learning_rate": 1.379903681217667e-06, "loss": 1.1135, "step": 21857 }, { "epoch": 0.66, "learning_rate": 1.3796856185505778e-06, "loss": 0.9601, "step": 21858 }, { "epoch": 0.66, "learning_rate": 1.3794675665483418e-06, "loss": 1.2166, "step": 21859 }, { "epoch": 0.66, "learning_rate": 1.379249525213035e-06, "loss": 1.0917, "step": 21860 }, { "epoch": 0.66, "learning_rate": 1.3790314945467337e-06, "loss": 1.0367, "step": 21861 }, { "epoch": 0.66, "learning_rate": 1.3788134745515118e-06, "loss": 1.3083, "step": 21862 }, { "epoch": 0.66, "learning_rate": 1.378595465229446e-06, "loss": 1.1926, "step": 21863 }, { "epoch": 0.66, "learning_rate": 1.3783774665826109e-06, "loss": 1.0769, "step": 21864 }, { "epoch": 0.66, "learning_rate": 1.378159478613083e-06, "loss": 1.1202, "step": 21865 }, { "epoch": 0.66, "learning_rate": 1.3779415013229358e-06, "loss": 1.0207, "step": 21866 }, { "epoch": 0.66, "learning_rate": 1.3777235347142453e-06, "loss": 1.1379, "step": 21867 }, { "epoch": 0.66, "learning_rate": 1.377505578789086e-06, "loss": 1.1356, "step": 21868 }, { "epoch": 0.66, "learning_rate": 1.3772876335495339e-06, "loss": 1.2132, "step": 21869 }, { "epoch": 0.66, "learning_rate": 1.3770696989976618e-06, "loss": 1.1722, "step": 21870 }, { "epoch": 0.66, "learning_rate": 1.3768517751355456e-06, "loss": 1.2126, "step": 21871 }, { "epoch": 0.66, "learning_rate": 1.3766338619652595e-06, "loss": 1.1732, "step": 21872 }, { "epoch": 0.66, "learning_rate": 1.3764159594888778e-06, "loss": 1.1334, "step": 21873 }, { "epoch": 0.66, "learning_rate": 1.3761980677084752e-06, "loss": 1.1558, "step": 21874 }, { "epoch": 0.66, "learning_rate": 1.3759801866261259e-06, "loss": 1.0865, "step": 21875 }, { "epoch": 0.66, "learning_rate": 1.3757623162439035e-06, "loss": 1.0079, "step": 21876 }, { "epoch": 0.66, "learning_rate": 1.3755444565638827e-06, "loss": 1.0945, "step": 21877 }, { "epoch": 0.66, "learning_rate": 1.3753266075881378e-06, "loss": 1.1896, "step": 21878 }, { "epoch": 0.66, "learning_rate": 1.3751087693187412e-06, "loss": 1.0474, "step": 21879 }, { "epoch": 0.66, "learning_rate": 1.3748909417577673e-06, "loss": 1.1808, "step": 21880 }, { "epoch": 0.66, "learning_rate": 1.3746731249072897e-06, "loss": 1.2555, "step": 21881 }, { "epoch": 0.66, "learning_rate": 1.3744553187693832e-06, "loss": 1.1682, "step": 21882 }, { "epoch": 0.66, "learning_rate": 1.3742375233461186e-06, "loss": 1.1127, "step": 21883 }, { "epoch": 0.66, "learning_rate": 1.374019738639571e-06, "loss": 1.0443, "step": 21884 }, { "epoch": 0.66, "learning_rate": 1.373801964651813e-06, "loss": 1.054, "step": 21885 }, { "epoch": 0.66, "learning_rate": 1.3735842013849187e-06, "loss": 1.1835, "step": 21886 }, { "epoch": 0.66, "learning_rate": 1.3733664488409598e-06, "loss": 1.136, "step": 21887 }, { "epoch": 0.66, "learning_rate": 1.3731487070220095e-06, "loss": 1.1158, "step": 21888 }, { "epoch": 0.66, "learning_rate": 1.3729309759301407e-06, "loss": 1.2152, "step": 21889 }, { "epoch": 0.66, "learning_rate": 1.372713255567426e-06, "loss": 1.0325, "step": 21890 }, { "epoch": 0.66, "learning_rate": 1.3724955459359397e-06, "loss": 1.0983, "step": 21891 }, { "epoch": 0.66, "learning_rate": 1.3722778470377512e-06, "loss": 1.1368, "step": 21892 }, { "epoch": 0.66, "learning_rate": 1.372060158874935e-06, "loss": 1.1278, "step": 21893 }, { "epoch": 0.66, "learning_rate": 1.3718424814495623e-06, "loss": 1.1552, "step": 21894 }, { "epoch": 0.66, "learning_rate": 1.3716248147637073e-06, "loss": 1.1, "step": 21895 }, { "epoch": 0.66, "learning_rate": 1.3714071588194394e-06, "loss": 1.0474, "step": 21896 }, { "epoch": 0.66, "learning_rate": 1.371189513618832e-06, "loss": 1.1326, "step": 21897 }, { "epoch": 0.66, "learning_rate": 1.3709718791639564e-06, "loss": 1.0849, "step": 21898 }, { "epoch": 0.66, "learning_rate": 1.3707542554568847e-06, "loss": 1.2541, "step": 21899 }, { "epoch": 0.66, "learning_rate": 1.370536642499689e-06, "loss": 1.1772, "step": 21900 }, { "epoch": 0.66, "learning_rate": 1.3703190402944406e-06, "loss": 1.0643, "step": 21901 }, { "epoch": 0.66, "learning_rate": 1.3701014488432107e-06, "loss": 1.1014, "step": 21902 }, { "epoch": 0.66, "learning_rate": 1.3698838681480717e-06, "loss": 1.142, "step": 21903 }, { "epoch": 0.66, "learning_rate": 1.369666298211093e-06, "loss": 1.1108, "step": 21904 }, { "epoch": 0.66, "learning_rate": 1.369448739034347e-06, "loss": 1.1561, "step": 21905 }, { "epoch": 0.66, "learning_rate": 1.369231190619904e-06, "loss": 1.2256, "step": 21906 }, { "epoch": 0.66, "learning_rate": 1.3690136529698361e-06, "loss": 1.0336, "step": 21907 }, { "epoch": 0.66, "learning_rate": 1.3687961260862142e-06, "loss": 1.1108, "step": 21908 }, { "epoch": 0.66, "learning_rate": 1.3685786099711073e-06, "loss": 1.0961, "step": 21909 }, { "epoch": 0.66, "learning_rate": 1.3683611046265872e-06, "loss": 1.0872, "step": 21910 }, { "epoch": 0.66, "learning_rate": 1.3681436100547246e-06, "loss": 1.1474, "step": 21911 }, { "epoch": 0.66, "learning_rate": 1.3679261262575905e-06, "loss": 1.313, "step": 21912 }, { "epoch": 0.66, "learning_rate": 1.3677086532372535e-06, "loss": 1.0492, "step": 21913 }, { "epoch": 0.66, "learning_rate": 1.3674911909957847e-06, "loss": 1.1956, "step": 21914 }, { "epoch": 0.66, "learning_rate": 1.3672737395352543e-06, "loss": 1.0399, "step": 21915 }, { "epoch": 0.66, "learning_rate": 1.3670562988577323e-06, "loss": 1.0605, "step": 21916 }, { "epoch": 0.66, "learning_rate": 1.3668388689652901e-06, "loss": 1.0765, "step": 21917 }, { "epoch": 0.66, "learning_rate": 1.3666214498599948e-06, "loss": 1.1341, "step": 21918 }, { "epoch": 0.66, "learning_rate": 1.3664040415439172e-06, "loss": 1.1779, "step": 21919 }, { "epoch": 0.66, "learning_rate": 1.3661866440191277e-06, "loss": 1.1852, "step": 21920 }, { "epoch": 0.66, "learning_rate": 1.365969257287696e-06, "loss": 1.0545, "step": 21921 }, { "epoch": 0.66, "learning_rate": 1.36575188135169e-06, "loss": 1.1313, "step": 21922 }, { "epoch": 0.66, "learning_rate": 1.3655345162131795e-06, "loss": 1.0515, "step": 21923 }, { "epoch": 0.66, "learning_rate": 1.3653171618742341e-06, "loss": 1.1419, "step": 21924 }, { "epoch": 0.66, "learning_rate": 1.3650998183369241e-06, "loss": 1.0662, "step": 21925 }, { "epoch": 0.66, "learning_rate": 1.364882485603316e-06, "loss": 1.0844, "step": 21926 }, { "epoch": 0.66, "learning_rate": 1.36466516367548e-06, "loss": 1.0864, "step": 21927 }, { "epoch": 0.66, "learning_rate": 1.364447852555485e-06, "loss": 1.036, "step": 21928 }, { "epoch": 0.66, "learning_rate": 1.364230552245399e-06, "loss": 1.1992, "step": 21929 }, { "epoch": 0.66, "learning_rate": 1.3640132627472919e-06, "loss": 1.2276, "step": 21930 }, { "epoch": 0.66, "learning_rate": 1.3637959840632308e-06, "loss": 1.1709, "step": 21931 }, { "epoch": 0.66, "learning_rate": 1.3635787161952852e-06, "loss": 1.1497, "step": 21932 }, { "epoch": 0.66, "learning_rate": 1.3633614591455228e-06, "loss": 1.047, "step": 21933 }, { "epoch": 0.66, "learning_rate": 1.3631442129160128e-06, "loss": 1.1282, "step": 21934 }, { "epoch": 0.66, "learning_rate": 1.362926977508821e-06, "loss": 1.1641, "step": 21935 }, { "epoch": 0.66, "learning_rate": 1.3627097529260174e-06, "loss": 1.1649, "step": 21936 }, { "epoch": 0.66, "learning_rate": 1.3624925391696686e-06, "loss": 1.1186, "step": 21937 }, { "epoch": 0.66, "learning_rate": 1.3622753362418446e-06, "loss": 1.1442, "step": 21938 }, { "epoch": 0.66, "learning_rate": 1.3620581441446102e-06, "loss": 1.0956, "step": 21939 }, { "epoch": 0.66, "learning_rate": 1.361840962880034e-06, "loss": 1.1942, "step": 21940 }, { "epoch": 0.66, "learning_rate": 1.3616237924501837e-06, "loss": 1.0463, "step": 21941 }, { "epoch": 0.66, "learning_rate": 1.3614066328571267e-06, "loss": 1.0675, "step": 21942 }, { "epoch": 0.66, "learning_rate": 1.3611894841029314e-06, "loss": 1.0715, "step": 21943 }, { "epoch": 0.66, "learning_rate": 1.3609723461896626e-06, "loss": 1.0792, "step": 21944 }, { "epoch": 0.66, "learning_rate": 1.3607552191193885e-06, "loss": 1.1151, "step": 21945 }, { "epoch": 0.66, "learning_rate": 1.3605381028941761e-06, "loss": 0.9537, "step": 21946 }, { "epoch": 0.66, "learning_rate": 1.3603209975160931e-06, "loss": 1.1138, "step": 21947 }, { "epoch": 0.66, "learning_rate": 1.3601039029872043e-06, "loss": 1.1149, "step": 21948 }, { "epoch": 0.66, "learning_rate": 1.359886819309577e-06, "loss": 1.1341, "step": 21949 }, { "epoch": 0.66, "learning_rate": 1.3596697464852788e-06, "loss": 1.1406, "step": 21950 }, { "epoch": 0.66, "learning_rate": 1.3594526845163758e-06, "loss": 1.1193, "step": 21951 }, { "epoch": 0.66, "learning_rate": 1.3592356334049334e-06, "loss": 1.0588, "step": 21952 }, { "epoch": 0.66, "learning_rate": 1.359018593153018e-06, "loss": 1.0732, "step": 21953 }, { "epoch": 0.66, "learning_rate": 1.358801563762696e-06, "loss": 1.2349, "step": 21954 }, { "epoch": 0.66, "learning_rate": 1.3585845452360342e-06, "loss": 1.0976, "step": 21955 }, { "epoch": 0.66, "learning_rate": 1.3583675375750971e-06, "loss": 1.1768, "step": 21956 }, { "epoch": 0.66, "learning_rate": 1.3581505407819515e-06, "loss": 1.1379, "step": 21957 }, { "epoch": 0.66, "learning_rate": 1.3579335548586628e-06, "loss": 1.0914, "step": 21958 }, { "epoch": 0.66, "learning_rate": 1.3577165798072966e-06, "loss": 1.0715, "step": 21959 }, { "epoch": 0.66, "learning_rate": 1.3574996156299192e-06, "loss": 1.1139, "step": 21960 }, { "epoch": 0.66, "learning_rate": 1.3572826623285945e-06, "loss": 1.1248, "step": 21961 }, { "epoch": 0.66, "learning_rate": 1.3570657199053882e-06, "loss": 1.186, "step": 21962 }, { "epoch": 0.66, "learning_rate": 1.3568487883623662e-06, "loss": 1.1481, "step": 21963 }, { "epoch": 0.66, "learning_rate": 1.3566318677015937e-06, "loss": 1.0364, "step": 21964 }, { "epoch": 0.66, "learning_rate": 1.3564149579251345e-06, "loss": 1.078, "step": 21965 }, { "epoch": 0.66, "learning_rate": 1.3561980590350543e-06, "loss": 1.1926, "step": 21966 }, { "epoch": 0.66, "learning_rate": 1.3559811710334176e-06, "loss": 1.1703, "step": 21967 }, { "epoch": 0.66, "learning_rate": 1.355764293922289e-06, "loss": 1.0821, "step": 21968 }, { "epoch": 0.66, "learning_rate": 1.3555474277037342e-06, "loss": 1.2199, "step": 21969 }, { "epoch": 0.66, "learning_rate": 1.3553305723798158e-06, "loss": 1.1071, "step": 21970 }, { "epoch": 0.66, "learning_rate": 1.355113727952599e-06, "loss": 1.1069, "step": 21971 }, { "epoch": 0.66, "learning_rate": 1.354896894424148e-06, "loss": 1.0554, "step": 21972 }, { "epoch": 0.66, "learning_rate": 1.3546800717965283e-06, "loss": 1.1044, "step": 21973 }, { "epoch": 0.66, "learning_rate": 1.3544632600718015e-06, "loss": 1.0403, "step": 21974 }, { "epoch": 0.66, "learning_rate": 1.3542464592520333e-06, "loss": 1.1334, "step": 21975 }, { "epoch": 0.66, "learning_rate": 1.3540296693392863e-06, "loss": 1.0997, "step": 21976 }, { "epoch": 0.66, "learning_rate": 1.3538128903356262e-06, "loss": 0.9975, "step": 21977 }, { "epoch": 0.66, "learning_rate": 1.3535961222431143e-06, "loss": 1.0865, "step": 21978 }, { "epoch": 0.66, "learning_rate": 1.3533793650638155e-06, "loss": 1.1127, "step": 21979 }, { "epoch": 0.66, "learning_rate": 1.3531626187997926e-06, "loss": 1.1123, "step": 21980 }, { "epoch": 0.66, "learning_rate": 1.3529458834531092e-06, "loss": 1.1777, "step": 21981 }, { "epoch": 0.66, "learning_rate": 1.3527291590258288e-06, "loss": 1.0955, "step": 21982 }, { "epoch": 0.66, "learning_rate": 1.352512445520014e-06, "loss": 1.1564, "step": 21983 }, { "epoch": 0.66, "learning_rate": 1.3522957429377281e-06, "loss": 1.1238, "step": 21984 }, { "epoch": 0.66, "learning_rate": 1.352079051281035e-06, "loss": 1.0859, "step": 21985 }, { "epoch": 0.66, "learning_rate": 1.3518623705519957e-06, "loss": 1.1505, "step": 21986 }, { "epoch": 0.66, "learning_rate": 1.3516457007526733e-06, "loss": 1.0976, "step": 21987 }, { "epoch": 0.66, "learning_rate": 1.351429041885131e-06, "loss": 1.1423, "step": 21988 }, { "epoch": 0.66, "learning_rate": 1.351212393951431e-06, "loss": 1.1282, "step": 21989 }, { "epoch": 0.66, "learning_rate": 1.350995756953637e-06, "loss": 1.0439, "step": 21990 }, { "epoch": 0.66, "learning_rate": 1.3507791308938086e-06, "loss": 1.1386, "step": 21991 }, { "epoch": 0.66, "learning_rate": 1.3505625157740095e-06, "loss": 1.1218, "step": 21992 }, { "epoch": 0.66, "learning_rate": 1.3503459115963019e-06, "loss": 1.1441, "step": 21993 }, { "epoch": 0.66, "learning_rate": 1.3501293183627472e-06, "loss": 1.0747, "step": 21994 }, { "epoch": 0.66, "learning_rate": 1.3499127360754088e-06, "loss": 1.0696, "step": 21995 }, { "epoch": 0.66, "learning_rate": 1.349696164736346e-06, "loss": 1.1204, "step": 21996 }, { "epoch": 0.66, "learning_rate": 1.3494796043476222e-06, "loss": 1.2415, "step": 21997 }, { "epoch": 0.66, "learning_rate": 1.3492630549112981e-06, "loss": 1.0812, "step": 21998 }, { "epoch": 0.66, "learning_rate": 1.3490465164294365e-06, "loss": 1.1214, "step": 21999 }, { "epoch": 0.66, "learning_rate": 1.3488299889040968e-06, "loss": 1.0505, "step": 22000 }, { "epoch": 0.66, "learning_rate": 1.348613472337341e-06, "loss": 1.1155, "step": 22001 }, { "epoch": 0.66, "learning_rate": 1.3483969667312307e-06, "loss": 1.1732, "step": 22002 }, { "epoch": 0.66, "learning_rate": 1.3481804720878277e-06, "loss": 1.0907, "step": 22003 }, { "epoch": 0.66, "learning_rate": 1.3479639884091905e-06, "loss": 1.1762, "step": 22004 }, { "epoch": 0.66, "learning_rate": 1.3477475156973818e-06, "loss": 1.1987, "step": 22005 }, { "epoch": 0.66, "learning_rate": 1.3475310539544614e-06, "loss": 1.1015, "step": 22006 }, { "epoch": 0.66, "learning_rate": 1.3473146031824904e-06, "loss": 1.2322, "step": 22007 }, { "epoch": 0.66, "learning_rate": 1.3470981633835302e-06, "loss": 1.1991, "step": 22008 }, { "epoch": 0.66, "learning_rate": 1.3468817345596393e-06, "loss": 1.1193, "step": 22009 }, { "epoch": 0.66, "learning_rate": 1.346665316712879e-06, "loss": 1.083, "step": 22010 }, { "epoch": 0.66, "learning_rate": 1.3464489098453092e-06, "loss": 1.0375, "step": 22011 }, { "epoch": 0.66, "learning_rate": 1.3462325139589904e-06, "loss": 1.0447, "step": 22012 }, { "epoch": 0.66, "learning_rate": 1.3460161290559826e-06, "loss": 1.0804, "step": 22013 }, { "epoch": 0.66, "learning_rate": 1.345799755138345e-06, "loss": 1.2101, "step": 22014 }, { "epoch": 0.66, "learning_rate": 1.345583392208138e-06, "loss": 1.0576, "step": 22015 }, { "epoch": 0.66, "learning_rate": 1.3453670402674224e-06, "loss": 1.1447, "step": 22016 }, { "epoch": 0.66, "learning_rate": 1.345150699318255e-06, "loss": 1.1185, "step": 22017 }, { "epoch": 0.66, "learning_rate": 1.344934369362697e-06, "loss": 1.1591, "step": 22018 }, { "epoch": 0.66, "learning_rate": 1.3447180504028076e-06, "loss": 1.0989, "step": 22019 }, { "epoch": 0.66, "learning_rate": 1.344501742440646e-06, "loss": 1.1259, "step": 22020 }, { "epoch": 0.66, "learning_rate": 1.3442854454782723e-06, "loss": 1.0745, "step": 22021 }, { "epoch": 0.66, "learning_rate": 1.344069159517743e-06, "loss": 1.0264, "step": 22022 }, { "epoch": 0.66, "learning_rate": 1.3438528845611192e-06, "loss": 1.108, "step": 22023 }, { "epoch": 0.66, "learning_rate": 1.343636620610459e-06, "loss": 1.1683, "step": 22024 }, { "epoch": 0.66, "learning_rate": 1.343420367667822e-06, "loss": 1.124, "step": 22025 }, { "epoch": 0.66, "learning_rate": 1.3432041257352652e-06, "loss": 0.9772, "step": 22026 }, { "epoch": 0.66, "learning_rate": 1.3429878948148485e-06, "loss": 1.1406, "step": 22027 }, { "epoch": 0.66, "learning_rate": 1.342771674908629e-06, "loss": 1.0552, "step": 22028 }, { "epoch": 0.66, "learning_rate": 1.342555466018667e-06, "loss": 1.0937, "step": 22029 }, { "epoch": 0.66, "learning_rate": 1.3423392681470189e-06, "loss": 1.2874, "step": 22030 }, { "epoch": 0.66, "learning_rate": 1.342123081295743e-06, "loss": 1.274, "step": 22031 }, { "epoch": 0.66, "learning_rate": 1.341906905466898e-06, "loss": 1.1363, "step": 22032 }, { "epoch": 0.66, "learning_rate": 1.3416907406625414e-06, "loss": 1.0245, "step": 22033 }, { "epoch": 0.66, "learning_rate": 1.3414745868847324e-06, "loss": 1.0848, "step": 22034 }, { "epoch": 0.66, "learning_rate": 1.341258444135526e-06, "loss": 1.1351, "step": 22035 }, { "epoch": 0.66, "learning_rate": 1.341042312416981e-06, "loss": 1.2012, "step": 22036 }, { "epoch": 0.66, "learning_rate": 1.3408261917311554e-06, "loss": 1.1346, "step": 22037 }, { "epoch": 0.66, "learning_rate": 1.340610082080106e-06, "loss": 1.0383, "step": 22038 }, { "epoch": 0.66, "learning_rate": 1.3403939834658901e-06, "loss": 1.1093, "step": 22039 }, { "epoch": 0.66, "learning_rate": 1.3401778958905654e-06, "loss": 1.2042, "step": 22040 }, { "epoch": 0.66, "learning_rate": 1.3399618193561881e-06, "loss": 1.1349, "step": 22041 }, { "epoch": 0.66, "learning_rate": 1.3397457538648167e-06, "loss": 1.0535, "step": 22042 }, { "epoch": 0.66, "learning_rate": 1.339529699418506e-06, "loss": 1.0634, "step": 22043 }, { "epoch": 0.66, "learning_rate": 1.3393136560193136e-06, "loss": 1.2299, "step": 22044 }, { "epoch": 0.66, "learning_rate": 1.3390976236692962e-06, "loss": 1.1764, "step": 22045 }, { "epoch": 0.66, "learning_rate": 1.3388816023705104e-06, "loss": 1.0589, "step": 22046 }, { "epoch": 0.66, "learning_rate": 1.3386655921250135e-06, "loss": 1.0656, "step": 22047 }, { "epoch": 0.66, "learning_rate": 1.3384495929348598e-06, "loss": 1.1565, "step": 22048 }, { "epoch": 0.66, "learning_rate": 1.3382336048021066e-06, "loss": 1.1664, "step": 22049 }, { "epoch": 0.66, "learning_rate": 1.3380176277288098e-06, "loss": 1.0164, "step": 22050 }, { "epoch": 0.66, "learning_rate": 1.337801661717027e-06, "loss": 1.1502, "step": 22051 }, { "epoch": 0.66, "learning_rate": 1.3375857067688113e-06, "loss": 1.1476, "step": 22052 }, { "epoch": 0.66, "learning_rate": 1.3373697628862198e-06, "loss": 1.0825, "step": 22053 }, { "epoch": 0.66, "learning_rate": 1.3371538300713082e-06, "loss": 1.2035, "step": 22054 }, { "epoch": 0.66, "learning_rate": 1.336937908326133e-06, "loss": 1.3126, "step": 22055 }, { "epoch": 0.66, "learning_rate": 1.3367219976527483e-06, "loss": 1.1717, "step": 22056 }, { "epoch": 0.66, "learning_rate": 1.3365060980532097e-06, "loss": 1.1121, "step": 22057 }, { "epoch": 0.66, "learning_rate": 1.3362902095295722e-06, "loss": 1.0311, "step": 22058 }, { "epoch": 0.66, "learning_rate": 1.3360743320838921e-06, "loss": 1.0226, "step": 22059 }, { "epoch": 0.66, "learning_rate": 1.3358584657182244e-06, "loss": 1.046, "step": 22060 }, { "epoch": 0.66, "learning_rate": 1.3356426104346223e-06, "loss": 1.1133, "step": 22061 }, { "epoch": 0.66, "learning_rate": 1.3354267662351421e-06, "loss": 1.1337, "step": 22062 }, { "epoch": 0.66, "learning_rate": 1.3352109331218382e-06, "loss": 1.0856, "step": 22063 }, { "epoch": 0.66, "learning_rate": 1.3349951110967651e-06, "loss": 1.0908, "step": 22064 }, { "epoch": 0.66, "learning_rate": 1.3347793001619775e-06, "loss": 1.0699, "step": 22065 }, { "epoch": 0.66, "learning_rate": 1.3345635003195299e-06, "loss": 1.0872, "step": 22066 }, { "epoch": 0.66, "learning_rate": 1.334347711571477e-06, "loss": 1.0105, "step": 22067 }, { "epoch": 0.66, "learning_rate": 1.3341319339198722e-06, "loss": 1.0496, "step": 22068 }, { "epoch": 0.66, "learning_rate": 1.3339161673667694e-06, "loss": 1.0654, "step": 22069 }, { "epoch": 0.66, "learning_rate": 1.3337004119142234e-06, "loss": 1.0559, "step": 22070 }, { "epoch": 0.66, "learning_rate": 1.3334846675642874e-06, "loss": 1.0215, "step": 22071 }, { "epoch": 0.66, "learning_rate": 1.333268934319017e-06, "loss": 1.0455, "step": 22072 }, { "epoch": 0.66, "learning_rate": 1.333053212180463e-06, "loss": 1.0976, "step": 22073 }, { "epoch": 0.66, "learning_rate": 1.3328375011506805e-06, "loss": 1.0839, "step": 22074 }, { "epoch": 0.67, "learning_rate": 1.332621801231723e-06, "loss": 1.1708, "step": 22075 }, { "epoch": 0.67, "learning_rate": 1.3324061124256437e-06, "loss": 1.095, "step": 22076 }, { "epoch": 0.67, "learning_rate": 1.3321904347344965e-06, "loss": 0.9979, "step": 22077 }, { "epoch": 0.67, "learning_rate": 1.3319747681603335e-06, "loss": 1.0496, "step": 22078 }, { "epoch": 0.67, "learning_rate": 1.3317591127052079e-06, "loss": 1.1465, "step": 22079 }, { "epoch": 0.67, "learning_rate": 1.331543468371173e-06, "loss": 1.1226, "step": 22080 }, { "epoch": 0.67, "learning_rate": 1.3313278351602823e-06, "loss": 1.1447, "step": 22081 }, { "epoch": 0.67, "learning_rate": 1.3311122130745868e-06, "loss": 1.0963, "step": 22082 }, { "epoch": 0.67, "learning_rate": 1.3308966021161405e-06, "loss": 1.1321, "step": 22083 }, { "epoch": 0.67, "learning_rate": 1.330681002286995e-06, "loss": 1.0722, "step": 22084 }, { "epoch": 0.67, "learning_rate": 1.3304654135892042e-06, "loss": 1.1465, "step": 22085 }, { "epoch": 0.67, "learning_rate": 1.3302498360248188e-06, "loss": 1.1698, "step": 22086 }, { "epoch": 0.67, "learning_rate": 1.3300342695958912e-06, "loss": 1.098, "step": 22087 }, { "epoch": 0.67, "learning_rate": 1.3298187143044743e-06, "loss": 1.0726, "step": 22088 }, { "epoch": 0.67, "learning_rate": 1.3296031701526195e-06, "loss": 1.0403, "step": 22089 }, { "epoch": 0.67, "learning_rate": 1.3293876371423798e-06, "loss": 1.1078, "step": 22090 }, { "epoch": 0.67, "learning_rate": 1.3291721152758046e-06, "loss": 1.0444, "step": 22091 }, { "epoch": 0.67, "learning_rate": 1.3289566045549474e-06, "loss": 1.2599, "step": 22092 }, { "epoch": 0.67, "learning_rate": 1.3287411049818593e-06, "loss": 1.1418, "step": 22093 }, { "epoch": 0.67, "learning_rate": 1.3285256165585916e-06, "loss": 1.0919, "step": 22094 }, { "epoch": 0.67, "learning_rate": 1.3283101392871961e-06, "loss": 1.1115, "step": 22095 }, { "epoch": 0.67, "learning_rate": 1.3280946731697237e-06, "loss": 1.138, "step": 22096 }, { "epoch": 0.67, "learning_rate": 1.3278792182082257e-06, "loss": 1.1158, "step": 22097 }, { "epoch": 0.67, "learning_rate": 1.3276637744047535e-06, "loss": 1.233, "step": 22098 }, { "epoch": 0.67, "learning_rate": 1.3274483417613572e-06, "loss": 1.2217, "step": 22099 }, { "epoch": 0.67, "learning_rate": 1.3272329202800877e-06, "loss": 1.1821, "step": 22100 }, { "epoch": 0.67, "learning_rate": 1.3270175099629956e-06, "loss": 1.1104, "step": 22101 }, { "epoch": 0.67, "learning_rate": 1.3268021108121324e-06, "loss": 1.1301, "step": 22102 }, { "epoch": 0.67, "learning_rate": 1.3265867228295487e-06, "loss": 1.06, "step": 22103 }, { "epoch": 0.67, "learning_rate": 1.3263713460172936e-06, "loss": 1.1423, "step": 22104 }, { "epoch": 0.67, "learning_rate": 1.3261559803774179e-06, "loss": 1.1444, "step": 22105 }, { "epoch": 0.67, "learning_rate": 1.325940625911972e-06, "loss": 1.1414, "step": 22106 }, { "epoch": 0.67, "learning_rate": 1.3257252826230068e-06, "loss": 1.0753, "step": 22107 }, { "epoch": 0.67, "learning_rate": 1.3255099505125705e-06, "loss": 1.1736, "step": 22108 }, { "epoch": 0.67, "learning_rate": 1.3252946295827135e-06, "loss": 1.0784, "step": 22109 }, { "epoch": 0.67, "learning_rate": 1.325079319835486e-06, "loss": 1.1678, "step": 22110 }, { "epoch": 0.67, "learning_rate": 1.3248640212729388e-06, "loss": 1.2104, "step": 22111 }, { "epoch": 0.67, "learning_rate": 1.324648733897119e-06, "loss": 1.1633, "step": 22112 }, { "epoch": 0.67, "learning_rate": 1.324433457710077e-06, "loss": 1.0764, "step": 22113 }, { "epoch": 0.67, "learning_rate": 1.3242181927138625e-06, "loss": 1.0839, "step": 22114 }, { "epoch": 0.67, "learning_rate": 1.3240029389105246e-06, "loss": 1.1501, "step": 22115 }, { "epoch": 0.67, "learning_rate": 1.3237876963021131e-06, "loss": 1.046, "step": 22116 }, { "epoch": 0.67, "learning_rate": 1.3235724648906757e-06, "loss": 1.0259, "step": 22117 }, { "epoch": 0.67, "learning_rate": 1.323357244678261e-06, "loss": 1.1357, "step": 22118 }, { "epoch": 0.67, "learning_rate": 1.3231420356669194e-06, "loss": 1.1792, "step": 22119 }, { "epoch": 0.67, "learning_rate": 1.3229268378586984e-06, "loss": 1.1404, "step": 22120 }, { "epoch": 0.67, "learning_rate": 1.3227116512556473e-06, "loss": 1.012, "step": 22121 }, { "epoch": 0.67, "learning_rate": 1.3224964758598141e-06, "loss": 1.1798, "step": 22122 }, { "epoch": 0.67, "learning_rate": 1.3222813116732475e-06, "loss": 1.0793, "step": 22123 }, { "epoch": 0.67, "learning_rate": 1.3220661586979965e-06, "loss": 1.14, "step": 22124 }, { "epoch": 0.67, "learning_rate": 1.3218510169361073e-06, "loss": 1.1265, "step": 22125 }, { "epoch": 0.67, "learning_rate": 1.3216358863896291e-06, "loss": 1.0627, "step": 22126 }, { "epoch": 0.67, "learning_rate": 1.3214207670606099e-06, "loss": 1.0853, "step": 22127 }, { "epoch": 0.67, "learning_rate": 1.3212056589510968e-06, "loss": 1.0153, "step": 22128 }, { "epoch": 0.67, "learning_rate": 1.3209905620631397e-06, "loss": 1.0968, "step": 22129 }, { "epoch": 0.67, "learning_rate": 1.3207754763987834e-06, "loss": 1.2183, "step": 22130 }, { "epoch": 0.67, "learning_rate": 1.3205604019600764e-06, "loss": 1.2093, "step": 22131 }, { "epoch": 0.67, "learning_rate": 1.3203453387490666e-06, "loss": 1.1431, "step": 22132 }, { "epoch": 0.67, "learning_rate": 1.3201302867678024e-06, "loss": 1.1323, "step": 22133 }, { "epoch": 0.67, "learning_rate": 1.319915246018328e-06, "loss": 1.0429, "step": 22134 }, { "epoch": 0.67, "learning_rate": 1.3197002165026922e-06, "loss": 1.0264, "step": 22135 }, { "epoch": 0.67, "learning_rate": 1.3194851982229424e-06, "loss": 1.1179, "step": 22136 }, { "epoch": 0.67, "learning_rate": 1.3192701911811253e-06, "loss": 1.14, "step": 22137 }, { "epoch": 0.67, "learning_rate": 1.3190551953792867e-06, "loss": 1.1257, "step": 22138 }, { "epoch": 0.67, "learning_rate": 1.3188402108194736e-06, "loss": 1.0963, "step": 22139 }, { "epoch": 0.67, "learning_rate": 1.3186252375037334e-06, "loss": 1.0369, "step": 22140 }, { "epoch": 0.67, "learning_rate": 1.3184102754341116e-06, "loss": 1.0801, "step": 22141 }, { "epoch": 0.67, "learning_rate": 1.3181953246126555e-06, "loss": 1.1733, "step": 22142 }, { "epoch": 0.67, "learning_rate": 1.3179803850414102e-06, "loss": 1.1389, "step": 22143 }, { "epoch": 0.67, "learning_rate": 1.3177654567224225e-06, "loss": 1.0507, "step": 22144 }, { "epoch": 0.67, "learning_rate": 1.317550539657738e-06, "loss": 1.0619, "step": 22145 }, { "epoch": 0.67, "learning_rate": 1.3173356338494028e-06, "loss": 1.0754, "step": 22146 }, { "epoch": 0.67, "learning_rate": 1.3171207392994628e-06, "loss": 0.998, "step": 22147 }, { "epoch": 0.67, "learning_rate": 1.316905856009964e-06, "loss": 1.0679, "step": 22148 }, { "epoch": 0.67, "learning_rate": 1.316690983982951e-06, "loss": 1.1926, "step": 22149 }, { "epoch": 0.67, "learning_rate": 1.3164761232204716e-06, "loss": 0.937, "step": 22150 }, { "epoch": 0.67, "learning_rate": 1.3162612737245683e-06, "loss": 1.045, "step": 22151 }, { "epoch": 0.67, "learning_rate": 1.3160464354972873e-06, "loss": 1.1536, "step": 22152 }, { "epoch": 0.67, "learning_rate": 1.3158316085406745e-06, "loss": 1.2216, "step": 22153 }, { "epoch": 0.67, "learning_rate": 1.3156167928567743e-06, "loss": 1.1122, "step": 22154 }, { "epoch": 0.67, "learning_rate": 1.3154019884476327e-06, "loss": 1.1332, "step": 22155 }, { "epoch": 0.67, "learning_rate": 1.3151871953152925e-06, "loss": 1.0954, "step": 22156 }, { "epoch": 0.67, "learning_rate": 1.3149724134617997e-06, "loss": 1.1279, "step": 22157 }, { "epoch": 0.67, "learning_rate": 1.3147576428891989e-06, "loss": 1.0782, "step": 22158 }, { "epoch": 0.67, "learning_rate": 1.3145428835995355e-06, "loss": 1.1697, "step": 22159 }, { "epoch": 0.67, "learning_rate": 1.3143281355948517e-06, "loss": 1.1581, "step": 22160 }, { "epoch": 0.67, "learning_rate": 1.3141133988771932e-06, "loss": 1.1005, "step": 22161 }, { "epoch": 0.67, "learning_rate": 1.3138986734486039e-06, "loss": 0.958, "step": 22162 }, { "epoch": 0.67, "learning_rate": 1.313683959311129e-06, "loss": 1.0719, "step": 22163 }, { "epoch": 0.67, "learning_rate": 1.3134692564668105e-06, "loss": 1.1192, "step": 22164 }, { "epoch": 0.67, "learning_rate": 1.3132545649176934e-06, "loss": 1.1234, "step": 22165 }, { "epoch": 0.67, "learning_rate": 1.313039884665821e-06, "loss": 1.1715, "step": 22166 }, { "epoch": 0.67, "learning_rate": 1.3128252157132376e-06, "loss": 1.155, "step": 22167 }, { "epoch": 0.67, "learning_rate": 1.3126105580619868e-06, "loss": 1.0906, "step": 22168 }, { "epoch": 0.67, "learning_rate": 1.312395911714111e-06, "loss": 1.1011, "step": 22169 }, { "epoch": 0.67, "learning_rate": 1.312181276671654e-06, "loss": 1.121, "step": 22170 }, { "epoch": 0.67, "learning_rate": 1.3119666529366595e-06, "loss": 1.0916, "step": 22171 }, { "epoch": 0.67, "learning_rate": 1.311752040511171e-06, "loss": 1.1381, "step": 22172 }, { "epoch": 0.67, "learning_rate": 1.31153743939723e-06, "loss": 1.0255, "step": 22173 }, { "epoch": 0.67, "learning_rate": 1.31132284959688e-06, "loss": 1.166, "step": 22174 }, { "epoch": 0.67, "learning_rate": 1.3111082711121642e-06, "loss": 1.0934, "step": 22175 }, { "epoch": 0.67, "learning_rate": 1.3108937039451248e-06, "loss": 1.0748, "step": 22176 }, { "epoch": 0.67, "learning_rate": 1.3106791480978047e-06, "loss": 1.0931, "step": 22177 }, { "epoch": 0.67, "learning_rate": 1.3104646035722462e-06, "loss": 1.035, "step": 22178 }, { "epoch": 0.67, "learning_rate": 1.3102500703704923e-06, "loss": 1.1385, "step": 22179 }, { "epoch": 0.67, "learning_rate": 1.3100355484945842e-06, "loss": 1.2681, "step": 22180 }, { "epoch": 0.67, "learning_rate": 1.309821037946566e-06, "loss": 1.0497, "step": 22181 }, { "epoch": 0.67, "learning_rate": 1.3096065387284768e-06, "loss": 1.0649, "step": 22182 }, { "epoch": 0.67, "learning_rate": 1.3093920508423602e-06, "loss": 1.096, "step": 22183 }, { "epoch": 0.67, "learning_rate": 1.309177574290258e-06, "loss": 1.1543, "step": 22184 }, { "epoch": 0.67, "learning_rate": 1.3089631090742128e-06, "loss": 1.2075, "step": 22185 }, { "epoch": 0.67, "learning_rate": 1.3087486551962642e-06, "loss": 1.1428, "step": 22186 }, { "epoch": 0.67, "learning_rate": 1.3085342126584545e-06, "loss": 1.032, "step": 22187 }, { "epoch": 0.67, "learning_rate": 1.3083197814628255e-06, "loss": 1.0955, "step": 22188 }, { "epoch": 0.67, "learning_rate": 1.308105361611419e-06, "loss": 1.0965, "step": 22189 }, { "epoch": 0.67, "learning_rate": 1.3078909531062744e-06, "loss": 1.1328, "step": 22190 }, { "epoch": 0.67, "learning_rate": 1.307676555949434e-06, "loss": 1.1356, "step": 22191 }, { "epoch": 0.67, "learning_rate": 1.3074621701429385e-06, "loss": 1.1433, "step": 22192 }, { "epoch": 0.67, "learning_rate": 1.3072477956888286e-06, "loss": 1.1979, "step": 22193 }, { "epoch": 0.67, "learning_rate": 1.3070334325891464e-06, "loss": 1.0352, "step": 22194 }, { "epoch": 0.67, "learning_rate": 1.3068190808459302e-06, "loss": 1.1293, "step": 22195 }, { "epoch": 0.67, "learning_rate": 1.3066047404612219e-06, "loss": 1.0235, "step": 22196 }, { "epoch": 0.67, "learning_rate": 1.3063904114370617e-06, "loss": 1.1895, "step": 22197 }, { "epoch": 0.67, "learning_rate": 1.3061760937754907e-06, "loss": 1.096, "step": 22198 }, { "epoch": 0.67, "learning_rate": 1.3059617874785476e-06, "loss": 1.1606, "step": 22199 }, { "epoch": 0.67, "learning_rate": 1.3057474925482732e-06, "loss": 1.0558, "step": 22200 }, { "epoch": 0.67, "learning_rate": 1.3055332089867074e-06, "loss": 1.0503, "step": 22201 }, { "epoch": 0.67, "learning_rate": 1.3053189367958903e-06, "loss": 1.1602, "step": 22202 }, { "epoch": 0.67, "learning_rate": 1.3051046759778613e-06, "loss": 1.0921, "step": 22203 }, { "epoch": 0.67, "learning_rate": 1.3048904265346603e-06, "loss": 1.1198, "step": 22204 }, { "epoch": 0.67, "learning_rate": 1.3046761884683273e-06, "loss": 1.1635, "step": 22205 }, { "epoch": 0.67, "learning_rate": 1.3044619617809006e-06, "loss": 1.1, "step": 22206 }, { "epoch": 0.67, "learning_rate": 1.3042477464744218e-06, "loss": 1.1644, "step": 22207 }, { "epoch": 0.67, "learning_rate": 1.3040335425509276e-06, "loss": 1.1268, "step": 22208 }, { "epoch": 0.67, "learning_rate": 1.3038193500124577e-06, "loss": 1.0648, "step": 22209 }, { "epoch": 0.67, "learning_rate": 1.3036051688610518e-06, "loss": 1.1693, "step": 22210 }, { "epoch": 0.67, "learning_rate": 1.3033909990987492e-06, "loss": 1.202, "step": 22211 }, { "epoch": 0.67, "learning_rate": 1.3031768407275868e-06, "loss": 1.105, "step": 22212 }, { "epoch": 0.67, "learning_rate": 1.302962693749605e-06, "loss": 1.0158, "step": 22213 }, { "epoch": 0.67, "learning_rate": 1.3027485581668418e-06, "loss": 1.1407, "step": 22214 }, { "epoch": 0.67, "learning_rate": 1.3025344339813365e-06, "loss": 1.1387, "step": 22215 }, { "epoch": 0.67, "learning_rate": 1.3023203211951258e-06, "loss": 1.0759, "step": 22216 }, { "epoch": 0.67, "learning_rate": 1.3021062198102486e-06, "loss": 1.0693, "step": 22217 }, { "epoch": 0.67, "learning_rate": 1.3018921298287435e-06, "loss": 1.1133, "step": 22218 }, { "epoch": 0.67, "learning_rate": 1.301678051252648e-06, "loss": 1.0798, "step": 22219 }, { "epoch": 0.67, "learning_rate": 1.3014639840840015e-06, "loss": 1.1681, "step": 22220 }, { "epoch": 0.67, "learning_rate": 1.3012499283248397e-06, "loss": 1.1669, "step": 22221 }, { "epoch": 0.67, "learning_rate": 1.3010358839772011e-06, "loss": 1.2258, "step": 22222 }, { "epoch": 0.67, "learning_rate": 1.3008218510431236e-06, "loss": 1.1819, "step": 22223 }, { "epoch": 0.67, "learning_rate": 1.3006078295246454e-06, "loss": 1.1669, "step": 22224 }, { "epoch": 0.67, "learning_rate": 1.300393819423802e-06, "loss": 1.2757, "step": 22225 }, { "epoch": 0.67, "learning_rate": 1.300179820742632e-06, "loss": 1.1293, "step": 22226 }, { "epoch": 0.67, "learning_rate": 1.2999658334831718e-06, "loss": 1.179, "step": 22227 }, { "epoch": 0.67, "learning_rate": 1.2997518576474593e-06, "loss": 1.0833, "step": 22228 }, { "epoch": 0.67, "learning_rate": 1.2995378932375308e-06, "loss": 1.1406, "step": 22229 }, { "epoch": 0.67, "learning_rate": 1.2993239402554236e-06, "loss": 0.9881, "step": 22230 }, { "epoch": 0.67, "learning_rate": 1.2991099987031742e-06, "loss": 1.1295, "step": 22231 }, { "epoch": 0.67, "learning_rate": 1.29889606858282e-06, "loss": 1.1173, "step": 22232 }, { "epoch": 0.67, "learning_rate": 1.2986821498963958e-06, "loss": 1.1003, "step": 22233 }, { "epoch": 0.67, "learning_rate": 1.2984682426459388e-06, "loss": 1.1024, "step": 22234 }, { "epoch": 0.67, "learning_rate": 1.298254346833486e-06, "loss": 1.1473, "step": 22235 }, { "epoch": 0.67, "learning_rate": 1.2980404624610726e-06, "loss": 1.149, "step": 22236 }, { "epoch": 0.67, "learning_rate": 1.2978265895307363e-06, "loss": 1.1375, "step": 22237 }, { "epoch": 0.67, "learning_rate": 1.2976127280445108e-06, "loss": 1.0438, "step": 22238 }, { "epoch": 0.67, "learning_rate": 1.2973988780044334e-06, "loss": 1.0008, "step": 22239 }, { "epoch": 0.67, "learning_rate": 1.297185039412539e-06, "loss": 0.9544, "step": 22240 }, { "epoch": 0.67, "learning_rate": 1.296971212270865e-06, "loss": 1.1687, "step": 22241 }, { "epoch": 0.67, "learning_rate": 1.2967573965814446e-06, "loss": 1.1274, "step": 22242 }, { "epoch": 0.67, "learning_rate": 1.296543592346314e-06, "loss": 1.1724, "step": 22243 }, { "epoch": 0.67, "learning_rate": 1.2963297995675089e-06, "loss": 1.2339, "step": 22244 }, { "epoch": 0.67, "learning_rate": 1.2961160182470647e-06, "loss": 1.0568, "step": 22245 }, { "epoch": 0.67, "learning_rate": 1.295902248387017e-06, "loss": 1.1567, "step": 22246 }, { "epoch": 0.67, "learning_rate": 1.295688489989399e-06, "loss": 1.1395, "step": 22247 }, { "epoch": 0.67, "learning_rate": 1.2954747430562465e-06, "loss": 1.1824, "step": 22248 }, { "epoch": 0.67, "learning_rate": 1.2952610075895945e-06, "loss": 1.0301, "step": 22249 }, { "epoch": 0.67, "learning_rate": 1.2950472835914784e-06, "loss": 1.0909, "step": 22250 }, { "epoch": 0.67, "learning_rate": 1.2948335710639309e-06, "loss": 1.1102, "step": 22251 }, { "epoch": 0.67, "learning_rate": 1.2946198700089874e-06, "loss": 1.0816, "step": 22252 }, { "epoch": 0.67, "learning_rate": 1.294406180428682e-06, "loss": 1.0491, "step": 22253 }, { "epoch": 0.67, "learning_rate": 1.29419250232505e-06, "loss": 1.184, "step": 22254 }, { "epoch": 0.67, "learning_rate": 1.293978835700124e-06, "loss": 1.0838, "step": 22255 }, { "epoch": 0.67, "learning_rate": 1.2937651805559388e-06, "loss": 1.0694, "step": 22256 }, { "epoch": 0.67, "learning_rate": 1.2935515368945275e-06, "loss": 1.0904, "step": 22257 }, { "epoch": 0.67, "learning_rate": 1.293337904717925e-06, "loss": 1.0937, "step": 22258 }, { "epoch": 0.67, "learning_rate": 1.2931242840281644e-06, "loss": 1.1373, "step": 22259 }, { "epoch": 0.67, "learning_rate": 1.2929106748272794e-06, "loss": 1.0228, "step": 22260 }, { "epoch": 0.67, "learning_rate": 1.2926970771173033e-06, "loss": 1.087, "step": 22261 }, { "epoch": 0.67, "learning_rate": 1.2924834909002698e-06, "loss": 1.1514, "step": 22262 }, { "epoch": 0.67, "learning_rate": 1.2922699161782126e-06, "loss": 1.0674, "step": 22263 }, { "epoch": 0.67, "learning_rate": 1.2920563529531632e-06, "loss": 1.151, "step": 22264 }, { "epoch": 0.67, "learning_rate": 1.2918428012271556e-06, "loss": 1.1391, "step": 22265 }, { "epoch": 0.67, "learning_rate": 1.291629261002223e-06, "loss": 1.1081, "step": 22266 }, { "epoch": 0.67, "learning_rate": 1.2914157322803983e-06, "loss": 1.183, "step": 22267 }, { "epoch": 0.67, "learning_rate": 1.2912022150637133e-06, "loss": 1.1817, "step": 22268 }, { "epoch": 0.67, "learning_rate": 1.2909887093542006e-06, "loss": 1.1411, "step": 22269 }, { "epoch": 0.67, "learning_rate": 1.2907752151538932e-06, "loss": 1.1991, "step": 22270 }, { "epoch": 0.67, "learning_rate": 1.2905617324648244e-06, "loss": 1.1233, "step": 22271 }, { "epoch": 0.67, "learning_rate": 1.2903482612890244e-06, "loss": 1.1224, "step": 22272 }, { "epoch": 0.67, "learning_rate": 1.2901348016285265e-06, "loss": 1.0441, "step": 22273 }, { "epoch": 0.67, "learning_rate": 1.2899213534853624e-06, "loss": 1.1248, "step": 22274 }, { "epoch": 0.67, "learning_rate": 1.2897079168615645e-06, "loss": 1.167, "step": 22275 }, { "epoch": 0.67, "learning_rate": 1.289494491759165e-06, "loss": 1.1724, "step": 22276 }, { "epoch": 0.67, "learning_rate": 1.289281078180194e-06, "loss": 1.1559, "step": 22277 }, { "epoch": 0.67, "learning_rate": 1.2890676761266843e-06, "loss": 1.0523, "step": 22278 }, { "epoch": 0.67, "learning_rate": 1.288854285600667e-06, "loss": 1.0917, "step": 22279 }, { "epoch": 0.67, "learning_rate": 1.2886409066041744e-06, "loss": 0.9974, "step": 22280 }, { "epoch": 0.67, "learning_rate": 1.2884275391392362e-06, "loss": 1.0225, "step": 22281 }, { "epoch": 0.67, "learning_rate": 1.2882141832078842e-06, "loss": 1.1248, "step": 22282 }, { "epoch": 0.67, "learning_rate": 1.2880008388121494e-06, "loss": 1.1046, "step": 22283 }, { "epoch": 0.67, "learning_rate": 1.2877875059540635e-06, "loss": 1.0726, "step": 22284 }, { "epoch": 0.67, "learning_rate": 1.287574184635656e-06, "loss": 1.1389, "step": 22285 }, { "epoch": 0.67, "learning_rate": 1.2873608748589589e-06, "loss": 1.1449, "step": 22286 }, { "epoch": 0.67, "learning_rate": 1.2871475766260017e-06, "loss": 1.169, "step": 22287 }, { "epoch": 0.67, "learning_rate": 1.286934289938816e-06, "loss": 1.1645, "step": 22288 }, { "epoch": 0.67, "learning_rate": 1.2867210147994321e-06, "loss": 1.0855, "step": 22289 }, { "epoch": 0.67, "learning_rate": 1.2865077512098788e-06, "loss": 1.0854, "step": 22290 }, { "epoch": 0.67, "learning_rate": 1.286294499172188e-06, "loss": 1.1521, "step": 22291 }, { "epoch": 0.67, "learning_rate": 1.2860812586883884e-06, "loss": 1.0928, "step": 22292 }, { "epoch": 0.67, "learning_rate": 1.2858680297605117e-06, "loss": 1.2197, "step": 22293 }, { "epoch": 0.67, "learning_rate": 1.2856548123905858e-06, "loss": 1.1119, "step": 22294 }, { "epoch": 0.67, "learning_rate": 1.2854416065806408e-06, "loss": 1.0723, "step": 22295 }, { "epoch": 0.67, "learning_rate": 1.2852284123327073e-06, "loss": 1.1687, "step": 22296 }, { "epoch": 0.67, "learning_rate": 1.285015229648815e-06, "loss": 1.1152, "step": 22297 }, { "epoch": 0.67, "learning_rate": 1.2848020585309912e-06, "loss": 1.0977, "step": 22298 }, { "epoch": 0.67, "learning_rate": 1.2845888989812673e-06, "loss": 1.2162, "step": 22299 }, { "epoch": 0.67, "learning_rate": 1.2843757510016712e-06, "loss": 1.0663, "step": 22300 }, { "epoch": 0.67, "learning_rate": 1.2841626145942326e-06, "loss": 1.171, "step": 22301 }, { "epoch": 0.67, "learning_rate": 1.2839494897609811e-06, "loss": 1.0694, "step": 22302 }, { "epoch": 0.67, "learning_rate": 1.283736376503944e-06, "loss": 1.1304, "step": 22303 }, { "epoch": 0.67, "learning_rate": 1.283523274825151e-06, "loss": 1.152, "step": 22304 }, { "epoch": 0.67, "learning_rate": 1.2833101847266305e-06, "loss": 1.1376, "step": 22305 }, { "epoch": 0.67, "learning_rate": 1.283097106210412e-06, "loss": 1.2144, "step": 22306 }, { "epoch": 0.67, "learning_rate": 1.2828840392785218e-06, "loss": 1.1374, "step": 22307 }, { "epoch": 0.67, "learning_rate": 1.2826709839329893e-06, "loss": 1.0244, "step": 22308 }, { "epoch": 0.67, "learning_rate": 1.282457940175843e-06, "loss": 1.097, "step": 22309 }, { "epoch": 0.67, "learning_rate": 1.2822449080091107e-06, "loss": 1.1774, "step": 22310 }, { "epoch": 0.67, "learning_rate": 1.2820318874348202e-06, "loss": 1.2188, "step": 22311 }, { "epoch": 0.67, "learning_rate": 1.2818188784549999e-06, "loss": 1.2914, "step": 22312 }, { "epoch": 0.67, "learning_rate": 1.281605881071677e-06, "loss": 1.144, "step": 22313 }, { "epoch": 0.67, "learning_rate": 1.2813928952868802e-06, "loss": 1.0444, "step": 22314 }, { "epoch": 0.67, "learning_rate": 1.2811799211026352e-06, "loss": 1.0496, "step": 22315 }, { "epoch": 0.67, "learning_rate": 1.2809669585209705e-06, "loss": 1.0735, "step": 22316 }, { "epoch": 0.67, "learning_rate": 1.280754007543913e-06, "loss": 1.1067, "step": 22317 }, { "epoch": 0.67, "learning_rate": 1.2805410681734903e-06, "loss": 1.1324, "step": 22318 }, { "epoch": 0.67, "learning_rate": 1.28032814041173e-06, "loss": 1.0704, "step": 22319 }, { "epoch": 0.67, "learning_rate": 1.2801152242606579e-06, "loss": 1.0414, "step": 22320 }, { "epoch": 0.67, "learning_rate": 1.2799023197223008e-06, "loss": 1.115, "step": 22321 }, { "epoch": 0.67, "learning_rate": 1.2796894267986864e-06, "loss": 1.0399, "step": 22322 }, { "epoch": 0.67, "learning_rate": 1.2794765454918417e-06, "loss": 1.1897, "step": 22323 }, { "epoch": 0.67, "learning_rate": 1.279263675803792e-06, "loss": 1.1593, "step": 22324 }, { "epoch": 0.67, "learning_rate": 1.2790508177365635e-06, "loss": 1.0782, "step": 22325 }, { "epoch": 0.67, "learning_rate": 1.2788379712921835e-06, "loss": 1.1407, "step": 22326 }, { "epoch": 0.67, "learning_rate": 1.2786251364726779e-06, "loss": 1.0428, "step": 22327 }, { "epoch": 0.67, "learning_rate": 1.2784123132800736e-06, "loss": 1.1679, "step": 22328 }, { "epoch": 0.67, "learning_rate": 1.2781995017163951e-06, "loss": 1.2275, "step": 22329 }, { "epoch": 0.67, "learning_rate": 1.2779867017836683e-06, "loss": 1.2127, "step": 22330 }, { "epoch": 0.67, "learning_rate": 1.27777391348392e-06, "loss": 1.1552, "step": 22331 }, { "epoch": 0.67, "learning_rate": 1.2775611368191765e-06, "loss": 1.0325, "step": 22332 }, { "epoch": 0.67, "learning_rate": 1.2773483717914609e-06, "loss": 1.0562, "step": 22333 }, { "epoch": 0.67, "learning_rate": 1.2771356184028e-06, "loss": 1.1527, "step": 22334 }, { "epoch": 0.67, "learning_rate": 1.2769228766552194e-06, "loss": 1.1168, "step": 22335 }, { "epoch": 0.67, "learning_rate": 1.2767101465507448e-06, "loss": 1.0768, "step": 22336 }, { "epoch": 0.67, "learning_rate": 1.276497428091399e-06, "loss": 1.137, "step": 22337 }, { "epoch": 0.67, "learning_rate": 1.276284721279209e-06, "loss": 1.0021, "step": 22338 }, { "epoch": 0.67, "learning_rate": 1.2760720261161988e-06, "loss": 1.0533, "step": 22339 }, { "epoch": 0.67, "learning_rate": 1.2758593426043936e-06, "loss": 0.9745, "step": 22340 }, { "epoch": 0.67, "learning_rate": 1.2756466707458176e-06, "loss": 1.1995, "step": 22341 }, { "epoch": 0.67, "learning_rate": 1.2754340105424962e-06, "loss": 1.1643, "step": 22342 }, { "epoch": 0.67, "learning_rate": 1.2752213619964527e-06, "loss": 1.1633, "step": 22343 }, { "epoch": 0.67, "learning_rate": 1.275008725109712e-06, "loss": 1.0263, "step": 22344 }, { "epoch": 0.67, "learning_rate": 1.2747960998842996e-06, "loss": 1.1997, "step": 22345 }, { "epoch": 0.67, "learning_rate": 1.2745834863222372e-06, "loss": 1.0244, "step": 22346 }, { "epoch": 0.67, "learning_rate": 1.2743708844255494e-06, "loss": 1.0613, "step": 22347 }, { "epoch": 0.67, "learning_rate": 1.274158294196261e-06, "loss": 1.0489, "step": 22348 }, { "epoch": 0.67, "learning_rate": 1.273945715636396e-06, "loss": 1.019, "step": 22349 }, { "epoch": 0.67, "learning_rate": 1.2737331487479764e-06, "loss": 1.2011, "step": 22350 }, { "epoch": 0.67, "learning_rate": 1.2735205935330264e-06, "loss": 1.1447, "step": 22351 }, { "epoch": 0.67, "learning_rate": 1.27330804999357e-06, "loss": 1.1102, "step": 22352 }, { "epoch": 0.67, "learning_rate": 1.2730955181316302e-06, "loss": 1.0073, "step": 22353 }, { "epoch": 0.67, "learning_rate": 1.2728829979492308e-06, "loss": 1.1382, "step": 22354 }, { "epoch": 0.67, "learning_rate": 1.2726704894483933e-06, "loss": 1.0342, "step": 22355 }, { "epoch": 0.67, "learning_rate": 1.272457992631142e-06, "loss": 1.2133, "step": 22356 }, { "epoch": 0.67, "learning_rate": 1.2722455074994988e-06, "loss": 0.9846, "step": 22357 }, { "epoch": 0.67, "learning_rate": 1.2720330340554887e-06, "loss": 1.0847, "step": 22358 }, { "epoch": 0.67, "learning_rate": 1.2718205723011311e-06, "loss": 1.0427, "step": 22359 }, { "epoch": 0.67, "learning_rate": 1.2716081222384508e-06, "loss": 1.1266, "step": 22360 }, { "epoch": 0.67, "learning_rate": 1.271395683869469e-06, "loss": 1.0841, "step": 22361 }, { "epoch": 0.67, "learning_rate": 1.2711832571962102e-06, "loss": 1.1688, "step": 22362 }, { "epoch": 0.67, "learning_rate": 1.2709708422206935e-06, "loss": 0.9962, "step": 22363 }, { "epoch": 0.67, "learning_rate": 1.2707584389449423e-06, "loss": 1.0579, "step": 22364 }, { "epoch": 0.67, "learning_rate": 1.270546047370979e-06, "loss": 1.0505, "step": 22365 }, { "epoch": 0.67, "learning_rate": 1.2703336675008254e-06, "loss": 1.1349, "step": 22366 }, { "epoch": 0.67, "learning_rate": 1.2701212993365029e-06, "loss": 1.0925, "step": 22367 }, { "epoch": 0.67, "learning_rate": 1.2699089428800333e-06, "loss": 1.0722, "step": 22368 }, { "epoch": 0.67, "learning_rate": 1.269696598133438e-06, "loss": 1.0389, "step": 22369 }, { "epoch": 0.67, "learning_rate": 1.2694842650987387e-06, "loss": 1.1258, "step": 22370 }, { "epoch": 0.67, "learning_rate": 1.2692719437779575e-06, "loss": 1.0491, "step": 22371 }, { "epoch": 0.67, "learning_rate": 1.2690596341731138e-06, "loss": 1.0667, "step": 22372 }, { "epoch": 0.67, "learning_rate": 1.2688473362862292e-06, "loss": 1.1784, "step": 22373 }, { "epoch": 0.67, "learning_rate": 1.268635050119325e-06, "loss": 1.2067, "step": 22374 }, { "epoch": 0.67, "learning_rate": 1.2684227756744232e-06, "loss": 1.0261, "step": 22375 }, { "epoch": 0.67, "learning_rate": 1.2682105129535427e-06, "loss": 0.9966, "step": 22376 }, { "epoch": 0.67, "learning_rate": 1.2679982619587048e-06, "loss": 1.0653, "step": 22377 }, { "epoch": 0.67, "learning_rate": 1.26778602269193e-06, "loss": 1.0443, "step": 22378 }, { "epoch": 0.67, "learning_rate": 1.2675737951552386e-06, "loss": 1.0745, "step": 22379 }, { "epoch": 0.67, "learning_rate": 1.2673615793506524e-06, "loss": 1.1529, "step": 22380 }, { "epoch": 0.67, "learning_rate": 1.2671493752801894e-06, "loss": 1.1239, "step": 22381 }, { "epoch": 0.67, "learning_rate": 1.2669371829458703e-06, "loss": 1.0515, "step": 22382 }, { "epoch": 0.67, "learning_rate": 1.2667250023497153e-06, "loss": 1.0035, "step": 22383 }, { "epoch": 0.67, "learning_rate": 1.2665128334937454e-06, "loss": 1.0195, "step": 22384 }, { "epoch": 0.67, "learning_rate": 1.2663006763799785e-06, "loss": 1.1288, "step": 22385 }, { "epoch": 0.67, "learning_rate": 1.2660885310104349e-06, "loss": 1.1557, "step": 22386 }, { "epoch": 0.67, "learning_rate": 1.2658763973871341e-06, "loss": 1.0052, "step": 22387 }, { "epoch": 0.67, "learning_rate": 1.2656642755120965e-06, "loss": 1.0478, "step": 22388 }, { "epoch": 0.67, "learning_rate": 1.2654521653873397e-06, "loss": 1.1479, "step": 22389 }, { "epoch": 0.67, "learning_rate": 1.2652400670148834e-06, "loss": 1.1489, "step": 22390 }, { "epoch": 0.67, "learning_rate": 1.2650279803967475e-06, "loss": 1.1216, "step": 22391 }, { "epoch": 0.67, "learning_rate": 1.2648159055349502e-06, "loss": 1.1547, "step": 22392 }, { "epoch": 0.67, "learning_rate": 1.2646038424315104e-06, "loss": 1.1546, "step": 22393 }, { "epoch": 0.67, "learning_rate": 1.2643917910884473e-06, "loss": 1.0611, "step": 22394 }, { "epoch": 0.67, "learning_rate": 1.2641797515077791e-06, "loss": 1.0898, "step": 22395 }, { "epoch": 0.67, "learning_rate": 1.263967723691525e-06, "loss": 1.1392, "step": 22396 }, { "epoch": 0.67, "learning_rate": 1.263755707641703e-06, "loss": 1.0291, "step": 22397 }, { "epoch": 0.67, "learning_rate": 1.2635437033603309e-06, "loss": 1.2193, "step": 22398 }, { "epoch": 0.67, "learning_rate": 1.263331710849427e-06, "loss": 1.1814, "step": 22399 }, { "epoch": 0.67, "learning_rate": 1.2631197301110098e-06, "loss": 1.1661, "step": 22400 }, { "epoch": 0.67, "learning_rate": 1.2629077611470978e-06, "loss": 1.107, "step": 22401 }, { "epoch": 0.67, "learning_rate": 1.262695803959707e-06, "loss": 1.0596, "step": 22402 }, { "epoch": 0.67, "learning_rate": 1.2624838585508567e-06, "loss": 0.9703, "step": 22403 }, { "epoch": 0.67, "learning_rate": 1.262271924922564e-06, "loss": 1.091, "step": 22404 }, { "epoch": 0.67, "learning_rate": 1.262060003076846e-06, "loss": 1.1357, "step": 22405 }, { "epoch": 0.67, "learning_rate": 1.261848093015722e-06, "loss": 1.0426, "step": 22406 }, { "epoch": 0.68, "learning_rate": 1.2616361947412065e-06, "loss": 1.1805, "step": 22407 }, { "epoch": 0.68, "learning_rate": 1.2614243082553184e-06, "loss": 1.0908, "step": 22408 }, { "epoch": 0.68, "learning_rate": 1.2612124335600743e-06, "loss": 1.1237, "step": 22409 }, { "epoch": 0.68, "learning_rate": 1.2610005706574918e-06, "loss": 1.0723, "step": 22410 }, { "epoch": 0.68, "learning_rate": 1.2607887195495866e-06, "loss": 1.1862, "step": 22411 }, { "epoch": 0.68, "learning_rate": 1.2605768802383754e-06, "loss": 1.0884, "step": 22412 }, { "epoch": 0.68, "learning_rate": 1.260365052725876e-06, "loss": 1.0984, "step": 22413 }, { "epoch": 0.68, "learning_rate": 1.2601532370141051e-06, "loss": 1.0819, "step": 22414 }, { "epoch": 0.68, "learning_rate": 1.2599414331050775e-06, "loss": 1.0016, "step": 22415 }, { "epoch": 0.68, "learning_rate": 1.2597296410008098e-06, "loss": 1.0959, "step": 22416 }, { "epoch": 0.68, "learning_rate": 1.2595178607033187e-06, "loss": 1.0919, "step": 22417 }, { "epoch": 0.68, "learning_rate": 1.25930609221462e-06, "loss": 1.1732, "step": 22418 }, { "epoch": 0.68, "learning_rate": 1.2590943355367307e-06, "loss": 1.0515, "step": 22419 }, { "epoch": 0.68, "learning_rate": 1.258882590671665e-06, "loss": 1.1313, "step": 22420 }, { "epoch": 0.68, "learning_rate": 1.258670857621439e-06, "loss": 1.1244, "step": 22421 }, { "epoch": 0.68, "learning_rate": 1.2584591363880689e-06, "loss": 1.1128, "step": 22422 }, { "epoch": 0.68, "learning_rate": 1.2582474269735697e-06, "loss": 1.0789, "step": 22423 }, { "epoch": 0.68, "learning_rate": 1.2580357293799571e-06, "loss": 1.1168, "step": 22424 }, { "epoch": 0.68, "learning_rate": 1.257824043609246e-06, "loss": 1.1996, "step": 22425 }, { "epoch": 0.68, "learning_rate": 1.2576123696634518e-06, "loss": 1.0098, "step": 22426 }, { "epoch": 0.68, "learning_rate": 1.2574007075445907e-06, "loss": 1.0574, "step": 22427 }, { "epoch": 0.68, "learning_rate": 1.2571890572546753e-06, "loss": 1.1257, "step": 22428 }, { "epoch": 0.68, "learning_rate": 1.2569774187957212e-06, "loss": 1.0826, "step": 22429 }, { "epoch": 0.68, "learning_rate": 1.2567657921697437e-06, "loss": 1.1509, "step": 22430 }, { "epoch": 0.68, "learning_rate": 1.256554177378757e-06, "loss": 1.2027, "step": 22431 }, { "epoch": 0.68, "learning_rate": 1.256342574424777e-06, "loss": 1.1439, "step": 22432 }, { "epoch": 0.68, "learning_rate": 1.2561309833098154e-06, "loss": 1.2524, "step": 22433 }, { "epoch": 0.68, "learning_rate": 1.255919404035888e-06, "loss": 1.2092, "step": 22434 }, { "epoch": 0.68, "learning_rate": 1.2557078366050085e-06, "loss": 1.1979, "step": 22435 }, { "epoch": 0.68, "learning_rate": 1.2554962810191917e-06, "loss": 1.2656, "step": 22436 }, { "epoch": 0.68, "learning_rate": 1.2552847372804506e-06, "loss": 1.2827, "step": 22437 }, { "epoch": 0.68, "learning_rate": 1.2550732053907991e-06, "loss": 1.2135, "step": 22438 }, { "epoch": 0.68, "learning_rate": 1.254861685352251e-06, "loss": 1.1083, "step": 22439 }, { "epoch": 0.68, "learning_rate": 1.2546501771668213e-06, "loss": 1.0662, "step": 22440 }, { "epoch": 0.68, "learning_rate": 1.2544386808365208e-06, "loss": 1.1, "step": 22441 }, { "epoch": 0.68, "learning_rate": 1.2542271963633646e-06, "loss": 1.1137, "step": 22442 }, { "epoch": 0.68, "learning_rate": 1.254015723749365e-06, "loss": 1.1817, "step": 22443 }, { "epoch": 0.68, "learning_rate": 1.253804262996537e-06, "loss": 1.2043, "step": 22444 }, { "epoch": 0.68, "learning_rate": 1.2535928141068908e-06, "loss": 1.1085, "step": 22445 }, { "epoch": 0.68, "learning_rate": 1.253381377082441e-06, "loss": 1.1218, "step": 22446 }, { "epoch": 0.68, "learning_rate": 1.2531699519252e-06, "loss": 1.1373, "step": 22447 }, { "epoch": 0.68, "learning_rate": 1.2529585386371806e-06, "loss": 1.037, "step": 22448 }, { "epoch": 0.68, "learning_rate": 1.2527471372203953e-06, "loss": 1.2448, "step": 22449 }, { "epoch": 0.68, "learning_rate": 1.2525357476768569e-06, "loss": 1.0278, "step": 22450 }, { "epoch": 0.68, "learning_rate": 1.2523243700085768e-06, "loss": 1.0513, "step": 22451 }, { "epoch": 0.68, "learning_rate": 1.2521130042175682e-06, "loss": 1.0447, "step": 22452 }, { "epoch": 0.68, "learning_rate": 1.251901650305844e-06, "loss": 1.0433, "step": 22453 }, { "epoch": 0.68, "learning_rate": 1.2516903082754134e-06, "loss": 1.2138, "step": 22454 }, { "epoch": 0.68, "learning_rate": 1.2514789781282901e-06, "loss": 1.2064, "step": 22455 }, { "epoch": 0.68, "learning_rate": 1.2512676598664858e-06, "loss": 1.0774, "step": 22456 }, { "epoch": 0.68, "learning_rate": 1.2510563534920128e-06, "loss": 1.1293, "step": 22457 }, { "epoch": 0.68, "learning_rate": 1.2508450590068807e-06, "loss": 1.0903, "step": 22458 }, { "epoch": 0.68, "learning_rate": 1.250633776413102e-06, "loss": 1.0894, "step": 22459 }, { "epoch": 0.68, "learning_rate": 1.2504225057126884e-06, "loss": 1.0742, "step": 22460 }, { "epoch": 0.68, "learning_rate": 1.2502112469076505e-06, "loss": 1.0152, "step": 22461 }, { "epoch": 0.68, "learning_rate": 1.2500000000000007e-06, "loss": 1.3086, "step": 22462 }, { "epoch": 0.68, "learning_rate": 1.2497887649917479e-06, "loss": 0.9965, "step": 22463 }, { "epoch": 0.68, "learning_rate": 1.2495775418849038e-06, "loss": 1.0941, "step": 22464 }, { "epoch": 0.68, "learning_rate": 1.249366330681479e-06, "loss": 0.9777, "step": 22465 }, { "epoch": 0.68, "learning_rate": 1.2491551313834857e-06, "loss": 1.1506, "step": 22466 }, { "epoch": 0.68, "learning_rate": 1.2489439439929323e-06, "loss": 1.1647, "step": 22467 }, { "epoch": 0.68, "learning_rate": 1.2487327685118297e-06, "loss": 1.0942, "step": 22468 }, { "epoch": 0.68, "learning_rate": 1.2485216049421888e-06, "loss": 1.1649, "step": 22469 }, { "epoch": 0.68, "learning_rate": 1.2483104532860205e-06, "loss": 1.1071, "step": 22470 }, { "epoch": 0.68, "learning_rate": 1.2480993135453326e-06, "loss": 1.0986, "step": 22471 }, { "epoch": 0.68, "learning_rate": 1.2478881857221364e-06, "loss": 1.0969, "step": 22472 }, { "epoch": 0.68, "learning_rate": 1.2476770698184418e-06, "loss": 1.0773, "step": 22473 }, { "epoch": 0.68, "learning_rate": 1.247465965836258e-06, "loss": 1.142, "step": 22474 }, { "epoch": 0.68, "learning_rate": 1.2472548737775953e-06, "loss": 1.1619, "step": 22475 }, { "epoch": 0.68, "learning_rate": 1.2470437936444627e-06, "loss": 1.1449, "step": 22476 }, { "epoch": 0.68, "learning_rate": 1.2468327254388699e-06, "loss": 1.1125, "step": 22477 }, { "epoch": 0.68, "learning_rate": 1.2466216691628258e-06, "loss": 1.0253, "step": 22478 }, { "epoch": 0.68, "learning_rate": 1.2464106248183408e-06, "loss": 1.0981, "step": 22479 }, { "epoch": 0.68, "learning_rate": 1.2461995924074218e-06, "loss": 1.1323, "step": 22480 }, { "epoch": 0.68, "learning_rate": 1.245988571932079e-06, "loss": 1.2585, "step": 22481 }, { "epoch": 0.68, "learning_rate": 1.2457775633943212e-06, "loss": 1.0834, "step": 22482 }, { "epoch": 0.68, "learning_rate": 1.2455665667961574e-06, "loss": 1.1315, "step": 22483 }, { "epoch": 0.68, "learning_rate": 1.2453555821395953e-06, "loss": 1.1644, "step": 22484 }, { "epoch": 0.68, "learning_rate": 1.2451446094266434e-06, "loss": 1.0695, "step": 22485 }, { "epoch": 0.68, "learning_rate": 1.2449336486593108e-06, "loss": 1.1493, "step": 22486 }, { "epoch": 0.68, "learning_rate": 1.2447226998396053e-06, "loss": 1.231, "step": 22487 }, { "epoch": 0.68, "learning_rate": 1.2445117629695362e-06, "loss": 1.1914, "step": 22488 }, { "epoch": 0.68, "learning_rate": 1.244300838051109e-06, "loss": 1.0861, "step": 22489 }, { "epoch": 0.68, "learning_rate": 1.2440899250863333e-06, "loss": 1.0906, "step": 22490 }, { "epoch": 0.68, "learning_rate": 1.243879024077217e-06, "loss": 1.0978, "step": 22491 }, { "epoch": 0.68, "learning_rate": 1.2436681350257682e-06, "loss": 1.121, "step": 22492 }, { "epoch": 0.68, "learning_rate": 1.2434572579339926e-06, "loss": 1.1469, "step": 22493 }, { "epoch": 0.68, "learning_rate": 1.2432463928038988e-06, "loss": 1.0877, "step": 22494 }, { "epoch": 0.68, "learning_rate": 1.2430355396374938e-06, "loss": 1.0385, "step": 22495 }, { "epoch": 0.68, "learning_rate": 1.2428246984367865e-06, "loss": 1.1019, "step": 22496 }, { "epoch": 0.68, "learning_rate": 1.2426138692037815e-06, "loss": 1.0375, "step": 22497 }, { "epoch": 0.68, "learning_rate": 1.2424030519404866e-06, "loss": 1.114, "step": 22498 }, { "epoch": 0.68, "learning_rate": 1.2421922466489092e-06, "loss": 1.1953, "step": 22499 }, { "epoch": 0.68, "learning_rate": 1.241981453331056e-06, "loss": 1.152, "step": 22500 }, { "epoch": 0.68, "learning_rate": 1.2417706719889342e-06, "loss": 1.1515, "step": 22501 }, { "epoch": 0.68, "learning_rate": 1.2415599026245486e-06, "loss": 1.0394, "step": 22502 }, { "epoch": 0.68, "learning_rate": 1.2413491452399068e-06, "loss": 1.1287, "step": 22503 }, { "epoch": 0.68, "learning_rate": 1.241138399837015e-06, "loss": 1.0623, "step": 22504 }, { "epoch": 0.68, "learning_rate": 1.240927666417879e-06, "loss": 1.2261, "step": 22505 }, { "epoch": 0.68, "learning_rate": 1.2407169449845054e-06, "loss": 1.0241, "step": 22506 }, { "epoch": 0.68, "learning_rate": 1.2405062355389002e-06, "loss": 0.9746, "step": 22507 }, { "epoch": 0.68, "learning_rate": 1.2402955380830689e-06, "loss": 1.1019, "step": 22508 }, { "epoch": 0.68, "learning_rate": 1.2400848526190186e-06, "loss": 1.171, "step": 22509 }, { "epoch": 0.68, "learning_rate": 1.2398741791487523e-06, "loss": 1.0807, "step": 22510 }, { "epoch": 0.68, "learning_rate": 1.2396635176742773e-06, "loss": 1.106, "step": 22511 }, { "epoch": 0.68, "learning_rate": 1.2394528681975985e-06, "loss": 1.1535, "step": 22512 }, { "epoch": 0.68, "learning_rate": 1.239242230720721e-06, "loss": 1.1096, "step": 22513 }, { "epoch": 0.68, "learning_rate": 1.2390316052456513e-06, "loss": 1.0347, "step": 22514 }, { "epoch": 0.68, "learning_rate": 1.238820991774393e-06, "loss": 1.0245, "step": 22515 }, { "epoch": 0.68, "learning_rate": 1.238610390308951e-06, "loss": 1.0934, "step": 22516 }, { "epoch": 0.68, "learning_rate": 1.2383998008513304e-06, "loss": 1.21, "step": 22517 }, { "epoch": 0.68, "learning_rate": 1.2381892234035373e-06, "loss": 1.1783, "step": 22518 }, { "epoch": 0.68, "learning_rate": 1.2379786579675742e-06, "loss": 1.0234, "step": 22519 }, { "epoch": 0.68, "learning_rate": 1.2377681045454462e-06, "loss": 1.1915, "step": 22520 }, { "epoch": 0.68, "learning_rate": 1.2375575631391581e-06, "loss": 0.9986, "step": 22521 }, { "epoch": 0.68, "learning_rate": 1.2373470337507152e-06, "loss": 1.1127, "step": 22522 }, { "epoch": 0.68, "learning_rate": 1.237136516382119e-06, "loss": 1.215, "step": 22523 }, { "epoch": 0.68, "learning_rate": 1.2369260110353753e-06, "loss": 1.095, "step": 22524 }, { "epoch": 0.68, "learning_rate": 1.2367155177124875e-06, "loss": 1.1147, "step": 22525 }, { "epoch": 0.68, "learning_rate": 1.2365050364154597e-06, "loss": 1.0673, "step": 22526 }, { "epoch": 0.68, "learning_rate": 1.2362945671462962e-06, "loss": 1.1204, "step": 22527 }, { "epoch": 0.68, "learning_rate": 1.236084109906999e-06, "loss": 1.0313, "step": 22528 }, { "epoch": 0.68, "learning_rate": 1.235873664699572e-06, "loss": 1.0565, "step": 22529 }, { "epoch": 0.68, "learning_rate": 1.2356632315260191e-06, "loss": 1.0845, "step": 22530 }, { "epoch": 0.68, "learning_rate": 1.2354528103883434e-06, "loss": 1.0934, "step": 22531 }, { "epoch": 0.68, "learning_rate": 1.2352424012885481e-06, "loss": 1.1656, "step": 22532 }, { "epoch": 0.68, "learning_rate": 1.2350320042286357e-06, "loss": 1.1103, "step": 22533 }, { "epoch": 0.68, "learning_rate": 1.2348216192106094e-06, "loss": 1.0652, "step": 22534 }, { "epoch": 0.68, "learning_rate": 1.234611246236473e-06, "loss": 1.1824, "step": 22535 }, { "epoch": 0.68, "learning_rate": 1.234400885308227e-06, "loss": 1.0552, "step": 22536 }, { "epoch": 0.68, "learning_rate": 1.2341905364278753e-06, "loss": 1.1255, "step": 22537 }, { "epoch": 0.68, "learning_rate": 1.23398019959742e-06, "loss": 0.9319, "step": 22538 }, { "epoch": 0.68, "learning_rate": 1.2337698748188633e-06, "loss": 1.106, "step": 22539 }, { "epoch": 0.68, "learning_rate": 1.2335595620942087e-06, "loss": 1.0623, "step": 22540 }, { "epoch": 0.68, "learning_rate": 1.2333492614254562e-06, "loss": 1.1225, "step": 22541 }, { "epoch": 0.68, "learning_rate": 1.2331389728146083e-06, "loss": 1.1459, "step": 22542 }, { "epoch": 0.68, "learning_rate": 1.2329286962636678e-06, "loss": 0.9971, "step": 22543 }, { "epoch": 0.68, "learning_rate": 1.2327184317746363e-06, "loss": 1.0696, "step": 22544 }, { "epoch": 0.68, "learning_rate": 1.2325081793495144e-06, "loss": 1.1097, "step": 22545 }, { "epoch": 0.68, "learning_rate": 1.2322979389903039e-06, "loss": 1.0261, "step": 22546 }, { "epoch": 0.68, "learning_rate": 1.2320877106990067e-06, "loss": 1.0314, "step": 22547 }, { "epoch": 0.68, "learning_rate": 1.2318774944776248e-06, "loss": 1.2423, "step": 22548 }, { "epoch": 0.68, "learning_rate": 1.2316672903281574e-06, "loss": 0.9827, "step": 22549 }, { "epoch": 0.68, "learning_rate": 1.2314570982526064e-06, "loss": 1.1042, "step": 22550 }, { "epoch": 0.68, "learning_rate": 1.2312469182529729e-06, "loss": 1.1759, "step": 22551 }, { "epoch": 0.68, "learning_rate": 1.231036750331258e-06, "loss": 1.0851, "step": 22552 }, { "epoch": 0.68, "learning_rate": 1.2308265944894627e-06, "loss": 1.1198, "step": 22553 }, { "epoch": 0.68, "learning_rate": 1.2306164507295862e-06, "loss": 1.1305, "step": 22554 }, { "epoch": 0.68, "learning_rate": 1.2304063190536297e-06, "loss": 1.1689, "step": 22555 }, { "epoch": 0.68, "learning_rate": 1.2301961994635936e-06, "loss": 1.2688, "step": 22556 }, { "epoch": 0.68, "learning_rate": 1.229986091961478e-06, "loss": 1.1635, "step": 22557 }, { "epoch": 0.68, "learning_rate": 1.229775996549283e-06, "loss": 1.0063, "step": 22558 }, { "epoch": 0.68, "learning_rate": 1.229565913229009e-06, "loss": 1.1738, "step": 22559 }, { "epoch": 0.68, "learning_rate": 1.2293558420026558e-06, "loss": 1.122, "step": 22560 }, { "epoch": 0.68, "learning_rate": 1.2291457828722236e-06, "loss": 1.1284, "step": 22561 }, { "epoch": 0.68, "learning_rate": 1.228935735839711e-06, "loss": 1.1744, "step": 22562 }, { "epoch": 0.68, "learning_rate": 1.2287257009071177e-06, "loss": 1.0715, "step": 22563 }, { "epoch": 0.68, "learning_rate": 1.2285156780764435e-06, "loss": 1.1505, "step": 22564 }, { "epoch": 0.68, "learning_rate": 1.2283056673496877e-06, "loss": 1.1368, "step": 22565 }, { "epoch": 0.68, "learning_rate": 1.2280956687288504e-06, "loss": 1.1049, "step": 22566 }, { "epoch": 0.68, "learning_rate": 1.2278856822159289e-06, "loss": 1.1083, "step": 22567 }, { "epoch": 0.68, "learning_rate": 1.227675707812923e-06, "loss": 1.2144, "step": 22568 }, { "epoch": 0.68, "learning_rate": 1.2274657455218314e-06, "loss": 1.2405, "step": 22569 }, { "epoch": 0.68, "learning_rate": 1.227255795344654e-06, "loss": 1.0905, "step": 22570 }, { "epoch": 0.68, "learning_rate": 1.2270458572833877e-06, "loss": 0.9848, "step": 22571 }, { "epoch": 0.68, "learning_rate": 1.2268359313400317e-06, "loss": 1.0214, "step": 22572 }, { "epoch": 0.68, "learning_rate": 1.2266260175165845e-06, "loss": 1.1828, "step": 22573 }, { "epoch": 0.68, "learning_rate": 1.2264161158150453e-06, "loss": 1.1345, "step": 22574 }, { "epoch": 0.68, "learning_rate": 1.2262062262374104e-06, "loss": 1.0627, "step": 22575 }, { "epoch": 0.68, "learning_rate": 1.2259963487856786e-06, "loss": 1.1841, "step": 22576 }, { "epoch": 0.68, "learning_rate": 1.225786483461848e-06, "loss": 1.0357, "step": 22577 }, { "epoch": 0.68, "learning_rate": 1.2255766302679162e-06, "loss": 1.1101, "step": 22578 }, { "epoch": 0.68, "learning_rate": 1.2253667892058824e-06, "loss": 1.118, "step": 22579 }, { "epoch": 0.68, "learning_rate": 1.2251569602777416e-06, "loss": 1.0269, "step": 22580 }, { "epoch": 0.68, "learning_rate": 1.224947143485493e-06, "loss": 1.1613, "step": 22581 }, { "epoch": 0.68, "learning_rate": 1.224737338831133e-06, "loss": 1.1467, "step": 22582 }, { "epoch": 0.68, "learning_rate": 1.2245275463166606e-06, "loss": 1.2018, "step": 22583 }, { "epoch": 0.68, "learning_rate": 1.2243177659440706e-06, "loss": 1.0483, "step": 22584 }, { "epoch": 0.68, "learning_rate": 1.224107997715361e-06, "loss": 1.1957, "step": 22585 }, { "epoch": 0.68, "learning_rate": 1.223898241632529e-06, "loss": 1.0377, "step": 22586 }, { "epoch": 0.68, "learning_rate": 1.2236884976975714e-06, "loss": 1.1046, "step": 22587 }, { "epoch": 0.68, "learning_rate": 1.2234787659124842e-06, "loss": 1.2022, "step": 22588 }, { "epoch": 0.68, "learning_rate": 1.2232690462792644e-06, "loss": 1.1337, "step": 22589 }, { "epoch": 0.68, "learning_rate": 1.2230593387999081e-06, "loss": 1.1712, "step": 22590 }, { "epoch": 0.68, "learning_rate": 1.2228496434764124e-06, "loss": 0.9797, "step": 22591 }, { "epoch": 0.68, "learning_rate": 1.222639960310774e-06, "loss": 1.1265, "step": 22592 }, { "epoch": 0.68, "learning_rate": 1.2224302893049867e-06, "loss": 1.233, "step": 22593 }, { "epoch": 0.68, "learning_rate": 1.2222206304610477e-06, "loss": 1.0897, "step": 22594 }, { "epoch": 0.68, "learning_rate": 1.222010983780953e-06, "loss": 1.0353, "step": 22595 }, { "epoch": 0.68, "learning_rate": 1.2218013492666991e-06, "loss": 1.1172, "step": 22596 }, { "epoch": 0.68, "learning_rate": 1.22159172692028e-06, "loss": 1.0707, "step": 22597 }, { "epoch": 0.68, "learning_rate": 1.2213821167436917e-06, "loss": 1.0392, "step": 22598 }, { "epoch": 0.68, "learning_rate": 1.2211725187389303e-06, "loss": 1.1397, "step": 22599 }, { "epoch": 0.68, "learning_rate": 1.2209629329079912e-06, "loss": 1.1588, "step": 22600 }, { "epoch": 0.68, "learning_rate": 1.220753359252868e-06, "loss": 1.0983, "step": 22601 }, { "epoch": 0.68, "learning_rate": 1.2205437977755569e-06, "loss": 0.9987, "step": 22602 }, { "epoch": 0.68, "learning_rate": 1.2203342484780526e-06, "loss": 1.0859, "step": 22603 }, { "epoch": 0.68, "learning_rate": 1.2201247113623498e-06, "loss": 1.1967, "step": 22604 }, { "epoch": 0.68, "learning_rate": 1.2199151864304446e-06, "loss": 1.0253, "step": 22605 }, { "epoch": 0.68, "learning_rate": 1.219705673684329e-06, "loss": 1.1096, "step": 22606 }, { "epoch": 0.68, "learning_rate": 1.219496173125999e-06, "loss": 1.1962, "step": 22607 }, { "epoch": 0.68, "learning_rate": 1.2192866847574485e-06, "loss": 1.085, "step": 22608 }, { "epoch": 0.68, "learning_rate": 1.2190772085806733e-06, "loss": 1.1018, "step": 22609 }, { "epoch": 0.68, "learning_rate": 1.218867744597665e-06, "loss": 1.1282, "step": 22610 }, { "epoch": 0.68, "learning_rate": 1.2186582928104184e-06, "loss": 1.097, "step": 22611 }, { "epoch": 0.68, "learning_rate": 1.2184488532209281e-06, "loss": 1.205, "step": 22612 }, { "epoch": 0.68, "learning_rate": 1.2182394258311875e-06, "loss": 1.1625, "step": 22613 }, { "epoch": 0.68, "learning_rate": 1.2180300106431903e-06, "loss": 1.0773, "step": 22614 }, { "epoch": 0.68, "learning_rate": 1.21782060765893e-06, "loss": 1.0444, "step": 22615 }, { "epoch": 0.68, "learning_rate": 1.2176112168803997e-06, "loss": 1.1731, "step": 22616 }, { "epoch": 0.68, "learning_rate": 1.2174018383095942e-06, "loss": 1.0687, "step": 22617 }, { "epoch": 0.68, "learning_rate": 1.2171924719485046e-06, "loss": 1.214, "step": 22618 }, { "epoch": 0.68, "learning_rate": 1.2169831177991246e-06, "loss": 1.1079, "step": 22619 }, { "epoch": 0.68, "learning_rate": 1.2167737758634474e-06, "loss": 1.0651, "step": 22620 }, { "epoch": 0.68, "learning_rate": 1.2165644461434661e-06, "loss": 1.0511, "step": 22621 }, { "epoch": 0.68, "learning_rate": 1.216355128641174e-06, "loss": 1.0323, "step": 22622 }, { "epoch": 0.68, "learning_rate": 1.2161458233585615e-06, "loss": 1.1478, "step": 22623 }, { "epoch": 0.68, "learning_rate": 1.215936530297623e-06, "loss": 1.1133, "step": 22624 }, { "epoch": 0.68, "learning_rate": 1.21572724946035e-06, "loss": 1.0923, "step": 22625 }, { "epoch": 0.68, "learning_rate": 1.2155179808487362e-06, "loss": 1.069, "step": 22626 }, { "epoch": 0.68, "learning_rate": 1.2153087244647716e-06, "loss": 1.1007, "step": 22627 }, { "epoch": 0.68, "learning_rate": 1.215099480310449e-06, "loss": 1.0779, "step": 22628 }, { "epoch": 0.68, "learning_rate": 1.2148902483877607e-06, "loss": 1.1089, "step": 22629 }, { "epoch": 0.68, "learning_rate": 1.2146810286986993e-06, "loss": 1.0577, "step": 22630 }, { "epoch": 0.68, "learning_rate": 1.2144718212452545e-06, "loss": 1.1959, "step": 22631 }, { "epoch": 0.68, "learning_rate": 1.2142626260294184e-06, "loss": 1.136, "step": 22632 }, { "epoch": 0.68, "learning_rate": 1.2140534430531834e-06, "loss": 1.1366, "step": 22633 }, { "epoch": 0.68, "learning_rate": 1.21384427231854e-06, "loss": 1.0593, "step": 22634 }, { "epoch": 0.68, "learning_rate": 1.213635113827481e-06, "loss": 1.1342, "step": 22635 }, { "epoch": 0.68, "learning_rate": 1.2134259675819948e-06, "loss": 1.0806, "step": 22636 }, { "epoch": 0.68, "learning_rate": 1.2132168335840742e-06, "loss": 1.043, "step": 22637 }, { "epoch": 0.68, "learning_rate": 1.2130077118357092e-06, "loss": 1.292, "step": 22638 }, { "epoch": 0.68, "learning_rate": 1.2127986023388914e-06, "loss": 1.1632, "step": 22639 }, { "epoch": 0.68, "learning_rate": 1.2125895050956105e-06, "loss": 1.1118, "step": 22640 }, { "epoch": 0.68, "learning_rate": 1.2123804201078575e-06, "loss": 1.076, "step": 22641 }, { "epoch": 0.68, "learning_rate": 1.2121713473776231e-06, "loss": 1.2072, "step": 22642 }, { "epoch": 0.68, "learning_rate": 1.2119622869068978e-06, "loss": 0.9997, "step": 22643 }, { "epoch": 0.68, "learning_rate": 1.2117532386976705e-06, "loss": 1.0544, "step": 22644 }, { "epoch": 0.68, "learning_rate": 1.211544202751932e-06, "loss": 1.0667, "step": 22645 }, { "epoch": 0.68, "learning_rate": 1.211335179071672e-06, "loss": 1.0084, "step": 22646 }, { "epoch": 0.68, "learning_rate": 1.2111261676588803e-06, "loss": 1.1343, "step": 22647 }, { "epoch": 0.68, "learning_rate": 1.210917168515548e-06, "loss": 1.0624, "step": 22648 }, { "epoch": 0.68, "learning_rate": 1.2107081816436623e-06, "loss": 1.2512, "step": 22649 }, { "epoch": 0.68, "learning_rate": 1.2104992070452136e-06, "loss": 1.1233, "step": 22650 }, { "epoch": 0.68, "learning_rate": 1.2102902447221918e-06, "loss": 1.0925, "step": 22651 }, { "epoch": 0.68, "learning_rate": 1.2100812946765864e-06, "loss": 1.1942, "step": 22652 }, { "epoch": 0.68, "learning_rate": 1.2098723569103848e-06, "loss": 1.1337, "step": 22653 }, { "epoch": 0.68, "learning_rate": 1.2096634314255774e-06, "loss": 1.1227, "step": 22654 }, { "epoch": 0.68, "learning_rate": 1.2094545182241524e-06, "loss": 1.1507, "step": 22655 }, { "epoch": 0.68, "learning_rate": 1.2092456173081e-06, "loss": 1.1219, "step": 22656 }, { "epoch": 0.68, "learning_rate": 1.2090367286794064e-06, "loss": 1.1354, "step": 22657 }, { "epoch": 0.68, "learning_rate": 1.2088278523400615e-06, "loss": 1.0496, "step": 22658 }, { "epoch": 0.68, "learning_rate": 1.2086189882920538e-06, "loss": 1.064, "step": 22659 }, { "epoch": 0.68, "learning_rate": 1.208410136537371e-06, "loss": 1.1466, "step": 22660 }, { "epoch": 0.68, "learning_rate": 1.208201297078003e-06, "loss": 1.252, "step": 22661 }, { "epoch": 0.68, "learning_rate": 1.2079924699159353e-06, "loss": 1.1389, "step": 22662 }, { "epoch": 0.68, "learning_rate": 1.2077836550531572e-06, "loss": 1.053, "step": 22663 }, { "epoch": 0.68, "learning_rate": 1.2075748524916562e-06, "loss": 1.1266, "step": 22664 }, { "epoch": 0.68, "learning_rate": 1.2073660622334203e-06, "loss": 1.2312, "step": 22665 }, { "epoch": 0.68, "learning_rate": 1.2071572842804377e-06, "loss": 1.1094, "step": 22666 }, { "epoch": 0.68, "learning_rate": 1.2069485186346943e-06, "loss": 0.9984, "step": 22667 }, { "epoch": 0.68, "learning_rate": 1.2067397652981782e-06, "loss": 1.1288, "step": 22668 }, { "epoch": 0.68, "learning_rate": 1.2065310242728766e-06, "loss": 1.2271, "step": 22669 }, { "epoch": 0.68, "learning_rate": 1.2063222955607768e-06, "loss": 0.987, "step": 22670 }, { "epoch": 0.68, "learning_rate": 1.2061135791638657e-06, "loss": 1.0954, "step": 22671 }, { "epoch": 0.68, "learning_rate": 1.20590487508413e-06, "loss": 0.9567, "step": 22672 }, { "epoch": 0.68, "learning_rate": 1.2056961833235566e-06, "loss": 1.0903, "step": 22673 }, { "epoch": 0.68, "learning_rate": 1.2054875038841334e-06, "loss": 1.2444, "step": 22674 }, { "epoch": 0.68, "learning_rate": 1.2052788367678447e-06, "loss": 1.0435, "step": 22675 }, { "epoch": 0.68, "learning_rate": 1.2050701819766777e-06, "loss": 1.0778, "step": 22676 }, { "epoch": 0.68, "learning_rate": 1.2048615395126193e-06, "loss": 1.1714, "step": 22677 }, { "epoch": 0.68, "learning_rate": 1.204652909377656e-06, "loss": 1.1367, "step": 22678 }, { "epoch": 0.68, "learning_rate": 1.2044442915737722e-06, "loss": 1.1035, "step": 22679 }, { "epoch": 0.68, "learning_rate": 1.2042356861029546e-06, "loss": 1.2017, "step": 22680 }, { "epoch": 0.68, "learning_rate": 1.2040270929671893e-06, "loss": 1.2068, "step": 22681 }, { "epoch": 0.68, "learning_rate": 1.203818512168463e-06, "loss": 1.2084, "step": 22682 }, { "epoch": 0.68, "learning_rate": 1.2036099437087592e-06, "loss": 1.1945, "step": 22683 }, { "epoch": 0.68, "learning_rate": 1.2034013875900644e-06, "loss": 1.1397, "step": 22684 }, { "epoch": 0.68, "learning_rate": 1.203192843814364e-06, "loss": 1.0063, "step": 22685 }, { "epoch": 0.68, "learning_rate": 1.2029843123836428e-06, "loss": 1.0599, "step": 22686 }, { "epoch": 0.68, "learning_rate": 1.2027757932998877e-06, "loss": 1.1437, "step": 22687 }, { "epoch": 0.68, "learning_rate": 1.2025672865650811e-06, "loss": 1.0885, "step": 22688 }, { "epoch": 0.68, "learning_rate": 1.202358792181209e-06, "loss": 1.1793, "step": 22689 }, { "epoch": 0.68, "learning_rate": 1.2021503101502563e-06, "loss": 1.1274, "step": 22690 }, { "epoch": 0.68, "learning_rate": 1.2019418404742087e-06, "loss": 1.1143, "step": 22691 }, { "epoch": 0.68, "learning_rate": 1.2017333831550485e-06, "loss": 1.1778, "step": 22692 }, { "epoch": 0.68, "learning_rate": 1.2015249381947614e-06, "loss": 1.2859, "step": 22693 }, { "epoch": 0.68, "learning_rate": 1.2013165055953313e-06, "loss": 0.9488, "step": 22694 }, { "epoch": 0.68, "learning_rate": 1.2011080853587426e-06, "loss": 1.0458, "step": 22695 }, { "epoch": 0.68, "learning_rate": 1.2008996774869794e-06, "loss": 1.0501, "step": 22696 }, { "epoch": 0.68, "learning_rate": 1.2006912819820255e-06, "loss": 1.129, "step": 22697 }, { "epoch": 0.68, "learning_rate": 1.200482898845865e-06, "loss": 1.0911, "step": 22698 }, { "epoch": 0.68, "learning_rate": 1.2002745280804814e-06, "loss": 1.2592, "step": 22699 }, { "epoch": 0.68, "learning_rate": 1.2000661696878593e-06, "loss": 1.1779, "step": 22700 }, { "epoch": 0.68, "learning_rate": 1.1998578236699801e-06, "loss": 1.1556, "step": 22701 }, { "epoch": 0.68, "learning_rate": 1.1996494900288282e-06, "loss": 1.0976, "step": 22702 }, { "epoch": 0.68, "learning_rate": 1.1994411687663873e-06, "loss": 1.1224, "step": 22703 }, { "epoch": 0.68, "learning_rate": 1.1992328598846405e-06, "loss": 0.9883, "step": 22704 }, { "epoch": 0.68, "learning_rate": 1.19902456338557e-06, "loss": 1.1331, "step": 22705 }, { "epoch": 0.68, "learning_rate": 1.198816279271159e-06, "loss": 1.088, "step": 22706 }, { "epoch": 0.68, "learning_rate": 1.19860800754339e-06, "loss": 1.0504, "step": 22707 }, { "epoch": 0.68, "learning_rate": 1.198399748204247e-06, "loss": 1.0273, "step": 22708 }, { "epoch": 0.68, "learning_rate": 1.1981915012557108e-06, "loss": 1.1885, "step": 22709 }, { "epoch": 0.68, "learning_rate": 1.1979832666997643e-06, "loss": 1.1583, "step": 22710 }, { "epoch": 0.68, "learning_rate": 1.1977750445383903e-06, "loss": 1.1072, "step": 22711 }, { "epoch": 0.68, "learning_rate": 1.1975668347735706e-06, "loss": 1.0754, "step": 22712 }, { "epoch": 0.68, "learning_rate": 1.1973586374072881e-06, "loss": 1.1005, "step": 22713 }, { "epoch": 0.68, "learning_rate": 1.1971504524415233e-06, "loss": 1.0003, "step": 22714 }, { "epoch": 0.68, "learning_rate": 1.1969422798782587e-06, "loss": 1.1346, "step": 22715 }, { "epoch": 0.68, "learning_rate": 1.196734119719476e-06, "loss": 1.1511, "step": 22716 }, { "epoch": 0.68, "learning_rate": 1.1965259719671577e-06, "loss": 1.2469, "step": 22717 }, { "epoch": 0.68, "learning_rate": 1.1963178366232833e-06, "loss": 1.1502, "step": 22718 }, { "epoch": 0.68, "learning_rate": 1.1961097136898353e-06, "loss": 1.0547, "step": 22719 }, { "epoch": 0.68, "learning_rate": 1.195901603168795e-06, "loss": 1.1226, "step": 22720 }, { "epoch": 0.68, "learning_rate": 1.1956935050621433e-06, "loss": 1.041, "step": 22721 }, { "epoch": 0.68, "learning_rate": 1.1954854193718612e-06, "loss": 1.0456, "step": 22722 }, { "epoch": 0.68, "learning_rate": 1.1952773460999298e-06, "loss": 1.0991, "step": 22723 }, { "epoch": 0.68, "learning_rate": 1.1950692852483296e-06, "loss": 1.066, "step": 22724 }, { "epoch": 0.68, "learning_rate": 1.1948612368190412e-06, "loss": 1.1817, "step": 22725 }, { "epoch": 0.68, "learning_rate": 1.1946532008140463e-06, "loss": 1.2335, "step": 22726 }, { "epoch": 0.68, "learning_rate": 1.1944451772353234e-06, "loss": 1.0917, "step": 22727 }, { "epoch": 0.68, "learning_rate": 1.1942371660848535e-06, "loss": 1.0294, "step": 22728 }, { "epoch": 0.68, "learning_rate": 1.1940291673646167e-06, "loss": 1.0955, "step": 22729 }, { "epoch": 0.68, "learning_rate": 1.1938211810765946e-06, "loss": 1.1788, "step": 22730 }, { "epoch": 0.68, "learning_rate": 1.1936132072227644e-06, "loss": 1.0948, "step": 22731 }, { "epoch": 0.68, "learning_rate": 1.1934052458051077e-06, "loss": 1.1132, "step": 22732 }, { "epoch": 0.68, "learning_rate": 1.1931972968256037e-06, "loss": 1.0948, "step": 22733 }, { "epoch": 0.68, "learning_rate": 1.1929893602862328e-06, "loss": 1.0032, "step": 22734 }, { "epoch": 0.68, "learning_rate": 1.1927814361889729e-06, "loss": 1.1658, "step": 22735 }, { "epoch": 0.68, "learning_rate": 1.1925735245358042e-06, "loss": 1.0764, "step": 22736 }, { "epoch": 0.68, "learning_rate": 1.1923656253287059e-06, "loss": 1.1717, "step": 22737 }, { "epoch": 0.68, "learning_rate": 1.1921577385696568e-06, "loss": 1.1375, "step": 22738 }, { "epoch": 0.69, "learning_rate": 1.1919498642606373e-06, "loss": 1.0782, "step": 22739 }, { "epoch": 0.69, "learning_rate": 1.1917420024036242e-06, "loss": 1.1255, "step": 22740 }, { "epoch": 0.69, "learning_rate": 1.191534153000597e-06, "loss": 1.0474, "step": 22741 }, { "epoch": 0.69, "learning_rate": 1.1913263160535347e-06, "loss": 1.1663, "step": 22742 }, { "epoch": 0.69, "learning_rate": 1.1911184915644161e-06, "loss": 1.1495, "step": 22743 }, { "epoch": 0.69, "learning_rate": 1.1909106795352185e-06, "loss": 1.1445, "step": 22744 }, { "epoch": 0.69, "learning_rate": 1.1907028799679207e-06, "loss": 1.1182, "step": 22745 }, { "epoch": 0.69, "learning_rate": 1.190495092864501e-06, "loss": 1.0958, "step": 22746 }, { "epoch": 0.69, "learning_rate": 1.1902873182269373e-06, "loss": 1.0993, "step": 22747 }, { "epoch": 0.69, "learning_rate": 1.1900795560572084e-06, "loss": 1.078, "step": 22748 }, { "epoch": 0.69, "learning_rate": 1.1898718063572904e-06, "loss": 1.1324, "step": 22749 }, { "epoch": 0.69, "learning_rate": 1.1896640691291617e-06, "loss": 1.2276, "step": 22750 }, { "epoch": 0.69, "learning_rate": 1.1894563443748e-06, "loss": 1.0733, "step": 22751 }, { "epoch": 0.69, "learning_rate": 1.189248632096183e-06, "loss": 1.1494, "step": 22752 }, { "epoch": 0.69, "learning_rate": 1.1890409322952873e-06, "loss": 1.2439, "step": 22753 }, { "epoch": 0.69, "learning_rate": 1.188833244974091e-06, "loss": 1.1057, "step": 22754 }, { "epoch": 0.69, "learning_rate": 1.1886255701345704e-06, "loss": 1.1936, "step": 22755 }, { "epoch": 0.69, "learning_rate": 1.1884179077787036e-06, "loss": 1.0578, "step": 22756 }, { "epoch": 0.69, "learning_rate": 1.188210257908466e-06, "loss": 1.1356, "step": 22757 }, { "epoch": 0.69, "learning_rate": 1.188002620525835e-06, "loss": 1.1982, "step": 22758 }, { "epoch": 0.69, "learning_rate": 1.187794995632787e-06, "loss": 0.9805, "step": 22759 }, { "epoch": 0.69, "learning_rate": 1.1875873832312994e-06, "loss": 1.2053, "step": 22760 }, { "epoch": 0.69, "learning_rate": 1.1873797833233475e-06, "loss": 1.2534, "step": 22761 }, { "epoch": 0.69, "learning_rate": 1.1871721959109076e-06, "loss": 1.2576, "step": 22762 }, { "epoch": 0.69, "learning_rate": 1.186964620995956e-06, "loss": 1.067, "step": 22763 }, { "epoch": 0.69, "learning_rate": 1.1867570585804688e-06, "loss": 1.1039, "step": 22764 }, { "epoch": 0.69, "learning_rate": 1.186549508666423e-06, "loss": 1.1456, "step": 22765 }, { "epoch": 0.69, "learning_rate": 1.1863419712557922e-06, "loss": 1.0478, "step": 22766 }, { "epoch": 0.69, "learning_rate": 1.1861344463505535e-06, "loss": 1.0858, "step": 22767 }, { "epoch": 0.69, "learning_rate": 1.1859269339526816e-06, "loss": 1.1856, "step": 22768 }, { "epoch": 0.69, "learning_rate": 1.1857194340641538e-06, "loss": 1.2029, "step": 22769 }, { "epoch": 0.69, "learning_rate": 1.1855119466869427e-06, "loss": 1.1698, "step": 22770 }, { "epoch": 0.69, "learning_rate": 1.185304471823025e-06, "loss": 1.0986, "step": 22771 }, { "epoch": 0.69, "learning_rate": 1.1850970094743754e-06, "loss": 1.1597, "step": 22772 }, { "epoch": 0.69, "learning_rate": 1.18488955964297e-06, "loss": 1.1553, "step": 22773 }, { "epoch": 0.69, "learning_rate": 1.1846821223307816e-06, "loss": 1.038, "step": 22774 }, { "epoch": 0.69, "learning_rate": 1.1844746975397862e-06, "loss": 1.1433, "step": 22775 }, { "epoch": 0.69, "learning_rate": 1.1842672852719578e-06, "loss": 1.0987, "step": 22776 }, { "epoch": 0.69, "learning_rate": 1.1840598855292714e-06, "loss": 1.0115, "step": 22777 }, { "epoch": 0.69, "learning_rate": 1.1838524983137008e-06, "loss": 1.1685, "step": 22778 }, { "epoch": 0.69, "learning_rate": 1.183645123627221e-06, "loss": 1.0822, "step": 22779 }, { "epoch": 0.69, "learning_rate": 1.1834377614718054e-06, "loss": 1.1786, "step": 22780 }, { "epoch": 0.69, "learning_rate": 1.1832304118494282e-06, "loss": 1.1385, "step": 22781 }, { "epoch": 0.69, "learning_rate": 1.183023074762064e-06, "loss": 1.0818, "step": 22782 }, { "epoch": 0.69, "learning_rate": 1.1828157502116855e-06, "loss": 1.0616, "step": 22783 }, { "epoch": 0.69, "learning_rate": 1.1826084382002661e-06, "loss": 1.1642, "step": 22784 }, { "epoch": 0.69, "learning_rate": 1.18240113872978e-06, "loss": 1.0632, "step": 22785 }, { "epoch": 0.69, "learning_rate": 1.182193851802202e-06, "loss": 1.1525, "step": 22786 }, { "epoch": 0.69, "learning_rate": 1.1819865774195022e-06, "loss": 1.1597, "step": 22787 }, { "epoch": 0.69, "learning_rate": 1.1817793155836558e-06, "loss": 1.1375, "step": 22788 }, { "epoch": 0.69, "learning_rate": 1.1815720662966353e-06, "loss": 1.1437, "step": 22789 }, { "epoch": 0.69, "learning_rate": 1.1813648295604138e-06, "loss": 1.0305, "step": 22790 }, { "epoch": 0.69, "learning_rate": 1.1811576053769649e-06, "loss": 1.0784, "step": 22791 }, { "epoch": 0.69, "learning_rate": 1.1809503937482595e-06, "loss": 1.0317, "step": 22792 }, { "epoch": 0.69, "learning_rate": 1.1807431946762713e-06, "loss": 1.1945, "step": 22793 }, { "epoch": 0.69, "learning_rate": 1.1805360081629722e-06, "loss": 1.1537, "step": 22794 }, { "epoch": 0.69, "learning_rate": 1.1803288342103358e-06, "loss": 1.0803, "step": 22795 }, { "epoch": 0.69, "learning_rate": 1.1801216728203323e-06, "loss": 1.0811, "step": 22796 }, { "epoch": 0.69, "learning_rate": 1.1799145239949353e-06, "loss": 1.1616, "step": 22797 }, { "epoch": 0.69, "learning_rate": 1.179707387736116e-06, "loss": 1.1398, "step": 22798 }, { "epoch": 0.69, "learning_rate": 1.1795002640458471e-06, "loss": 1.0967, "step": 22799 }, { "epoch": 0.69, "learning_rate": 1.1792931529260993e-06, "loss": 1.1126, "step": 22800 }, { "epoch": 0.69, "learning_rate": 1.179086054378844e-06, "loss": 1.0954, "step": 22801 }, { "epoch": 0.69, "learning_rate": 1.1788789684060538e-06, "loss": 1.1449, "step": 22802 }, { "epoch": 0.69, "learning_rate": 1.1786718950096992e-06, "loss": 1.1887, "step": 22803 }, { "epoch": 0.69, "learning_rate": 1.178464834191752e-06, "loss": 1.1902, "step": 22804 }, { "epoch": 0.69, "learning_rate": 1.1782577859541833e-06, "loss": 1.1461, "step": 22805 }, { "epoch": 0.69, "learning_rate": 1.1780507502989635e-06, "loss": 1.0521, "step": 22806 }, { "epoch": 0.69, "learning_rate": 1.1778437272280641e-06, "loss": 1.1047, "step": 22807 }, { "epoch": 0.69, "learning_rate": 1.1776367167434566e-06, "loss": 1.1016, "step": 22808 }, { "epoch": 0.69, "learning_rate": 1.1774297188471096e-06, "loss": 1.1461, "step": 22809 }, { "epoch": 0.69, "learning_rate": 1.177222733540995e-06, "loss": 1.0208, "step": 22810 }, { "epoch": 0.69, "learning_rate": 1.1770157608270827e-06, "loss": 1.1963, "step": 22811 }, { "epoch": 0.69, "learning_rate": 1.176808800707344e-06, "loss": 1.1604, "step": 22812 }, { "epoch": 0.69, "learning_rate": 1.1766018531837476e-06, "loss": 1.134, "step": 22813 }, { "epoch": 0.69, "learning_rate": 1.1763949182582638e-06, "loss": 1.1664, "step": 22814 }, { "epoch": 0.69, "learning_rate": 1.1761879959328633e-06, "loss": 1.0682, "step": 22815 }, { "epoch": 0.69, "learning_rate": 1.1759810862095162e-06, "loss": 1.1165, "step": 22816 }, { "epoch": 0.69, "learning_rate": 1.1757741890901905e-06, "loss": 1.097, "step": 22817 }, { "epoch": 0.69, "learning_rate": 1.175567304576857e-06, "loss": 1.0695, "step": 22818 }, { "epoch": 0.69, "learning_rate": 1.1753604326714848e-06, "loss": 0.9506, "step": 22819 }, { "epoch": 0.69, "learning_rate": 1.1751535733760433e-06, "loss": 1.1279, "step": 22820 }, { "epoch": 0.69, "learning_rate": 1.1749467266925024e-06, "loss": 1.0765, "step": 22821 }, { "epoch": 0.69, "learning_rate": 1.17473989262283e-06, "loss": 1.0156, "step": 22822 }, { "epoch": 0.69, "learning_rate": 1.1745330711689953e-06, "loss": 1.0015, "step": 22823 }, { "epoch": 0.69, "learning_rate": 1.1743262623329673e-06, "loss": 1.0552, "step": 22824 }, { "epoch": 0.69, "learning_rate": 1.174119466116716e-06, "loss": 1.1899, "step": 22825 }, { "epoch": 0.69, "learning_rate": 1.1739126825222078e-06, "loss": 1.1135, "step": 22826 }, { "epoch": 0.69, "learning_rate": 1.1737059115514121e-06, "loss": 1.0741, "step": 22827 }, { "epoch": 0.69, "learning_rate": 1.1734991532062975e-06, "loss": 1.007, "step": 22828 }, { "epoch": 0.69, "learning_rate": 1.173292407488832e-06, "loss": 1.1264, "step": 22829 }, { "epoch": 0.69, "learning_rate": 1.1730856744009847e-06, "loss": 1.0992, "step": 22830 }, { "epoch": 0.69, "learning_rate": 1.172878953944722e-06, "loss": 1.0482, "step": 22831 }, { "epoch": 0.69, "learning_rate": 1.1726722461220123e-06, "loss": 1.1371, "step": 22832 }, { "epoch": 0.69, "learning_rate": 1.1724655509348236e-06, "loss": 1.0203, "step": 22833 }, { "epoch": 0.69, "learning_rate": 1.1722588683851235e-06, "loss": 1.0729, "step": 22834 }, { "epoch": 0.69, "learning_rate": 1.1720521984748795e-06, "loss": 0.9952, "step": 22835 }, { "epoch": 0.69, "learning_rate": 1.1718455412060588e-06, "loss": 1.0952, "step": 22836 }, { "epoch": 0.69, "learning_rate": 1.1716388965806294e-06, "loss": 1.0676, "step": 22837 }, { "epoch": 0.69, "learning_rate": 1.1714322646005585e-06, "loss": 0.9958, "step": 22838 }, { "epoch": 0.69, "learning_rate": 1.1712256452678118e-06, "loss": 1.1155, "step": 22839 }, { "epoch": 0.69, "learning_rate": 1.171019038584357e-06, "loss": 1.1099, "step": 22840 }, { "epoch": 0.69, "learning_rate": 1.1708124445521608e-06, "loss": 1.0485, "step": 22841 }, { "epoch": 0.69, "learning_rate": 1.170605863173191e-06, "loss": 1.0911, "step": 22842 }, { "epoch": 0.69, "learning_rate": 1.170399294449412e-06, "loss": 1.1838, "step": 22843 }, { "epoch": 0.69, "learning_rate": 1.1701927383827913e-06, "loss": 1.1445, "step": 22844 }, { "epoch": 0.69, "learning_rate": 1.1699861949752955e-06, "loss": 1.0352, "step": 22845 }, { "epoch": 0.69, "learning_rate": 1.1697796642288905e-06, "loss": 1.1772, "step": 22846 }, { "epoch": 0.69, "learning_rate": 1.1695731461455433e-06, "loss": 0.9816, "step": 22847 }, { "epoch": 0.69, "learning_rate": 1.1693666407272183e-06, "loss": 1.1833, "step": 22848 }, { "epoch": 0.69, "learning_rate": 1.1691601479758818e-06, "loss": 1.1541, "step": 22849 }, { "epoch": 0.69, "learning_rate": 1.1689536678934998e-06, "loss": 1.1066, "step": 22850 }, { "epoch": 0.69, "learning_rate": 1.1687472004820389e-06, "loss": 1.1317, "step": 22851 }, { "epoch": 0.69, "learning_rate": 1.1685407457434624e-06, "loss": 1.0861, "step": 22852 }, { "epoch": 0.69, "learning_rate": 1.1683343036797369e-06, "loss": 1.1577, "step": 22853 }, { "epoch": 0.69, "learning_rate": 1.1681278742928273e-06, "loss": 1.0695, "step": 22854 }, { "epoch": 0.69, "learning_rate": 1.1679214575846997e-06, "loss": 1.1675, "step": 22855 }, { "epoch": 0.69, "learning_rate": 1.1677150535573175e-06, "loss": 1.1644, "step": 22856 }, { "epoch": 0.69, "learning_rate": 1.1675086622126463e-06, "loss": 1.1314, "step": 22857 }, { "epoch": 0.69, "learning_rate": 1.1673022835526513e-06, "loss": 1.0789, "step": 22858 }, { "epoch": 0.69, "learning_rate": 1.1670959175792961e-06, "loss": 1.0992, "step": 22859 }, { "epoch": 0.69, "learning_rate": 1.166889564294546e-06, "loss": 1.0263, "step": 22860 }, { "epoch": 0.69, "learning_rate": 1.1666832237003654e-06, "loss": 1.0505, "step": 22861 }, { "epoch": 0.69, "learning_rate": 1.1664768957987183e-06, "loss": 1.1785, "step": 22862 }, { "epoch": 0.69, "learning_rate": 1.1662705805915688e-06, "loss": 1.0811, "step": 22863 }, { "epoch": 0.69, "learning_rate": 1.166064278080882e-06, "loss": 1.0875, "step": 22864 }, { "epoch": 0.69, "learning_rate": 1.16585798826862e-06, "loss": 0.9502, "step": 22865 }, { "epoch": 0.69, "learning_rate": 1.1656517111567472e-06, "loss": 1.0627, "step": 22866 }, { "epoch": 0.69, "learning_rate": 1.1654454467472277e-06, "loss": 1.042, "step": 22867 }, { "epoch": 0.69, "learning_rate": 1.1652391950420256e-06, "loss": 1.2622, "step": 22868 }, { "epoch": 0.69, "learning_rate": 1.1650329560431025e-06, "loss": 1.14, "step": 22869 }, { "epoch": 0.69, "learning_rate": 1.1648267297524227e-06, "loss": 1.098, "step": 22870 }, { "epoch": 0.69, "learning_rate": 1.1646205161719495e-06, "loss": 1.0938, "step": 22871 }, { "epoch": 0.69, "learning_rate": 1.1644143153036458e-06, "loss": 1.161, "step": 22872 }, { "epoch": 0.69, "learning_rate": 1.1642081271494756e-06, "loss": 1.0561, "step": 22873 }, { "epoch": 0.69, "learning_rate": 1.1640019517113999e-06, "loss": 1.1576, "step": 22874 }, { "epoch": 0.69, "learning_rate": 1.1637957889913817e-06, "loss": 1.1489, "step": 22875 }, { "epoch": 0.69, "learning_rate": 1.1635896389913846e-06, "loss": 1.106, "step": 22876 }, { "epoch": 0.69, "learning_rate": 1.163383501713371e-06, "loss": 1.078, "step": 22877 }, { "epoch": 0.69, "learning_rate": 1.1631773771593018e-06, "loss": 1.1799, "step": 22878 }, { "epoch": 0.69, "learning_rate": 1.1629712653311407e-06, "loss": 1.0885, "step": 22879 }, { "epoch": 0.69, "learning_rate": 1.1627651662308486e-06, "loss": 1.085, "step": 22880 }, { "epoch": 0.69, "learning_rate": 1.1625590798603892e-06, "loss": 1.1652, "step": 22881 }, { "epoch": 0.69, "learning_rate": 1.1623530062217226e-06, "loss": 1.0786, "step": 22882 }, { "epoch": 0.69, "learning_rate": 1.1621469453168109e-06, "loss": 1.0388, "step": 22883 }, { "epoch": 0.69, "learning_rate": 1.1619408971476157e-06, "loss": 1.0556, "step": 22884 }, { "epoch": 0.69, "learning_rate": 1.161734861716099e-06, "loss": 1.187, "step": 22885 }, { "epoch": 0.69, "learning_rate": 1.1615288390242219e-06, "loss": 1.1633, "step": 22886 }, { "epoch": 0.69, "learning_rate": 1.1613228290739453e-06, "loss": 0.9442, "step": 22887 }, { "epoch": 0.69, "learning_rate": 1.161116831867231e-06, "loss": 1.0792, "step": 22888 }, { "epoch": 0.69, "learning_rate": 1.1609108474060397e-06, "loss": 1.2335, "step": 22889 }, { "epoch": 0.69, "learning_rate": 1.1607048756923327e-06, "loss": 1.0561, "step": 22890 }, { "epoch": 0.69, "learning_rate": 1.1604989167280697e-06, "loss": 1.1212, "step": 22891 }, { "epoch": 0.69, "learning_rate": 1.1602929705152119e-06, "loss": 1.069, "step": 22892 }, { "epoch": 0.69, "learning_rate": 1.1600870370557195e-06, "loss": 1.1091, "step": 22893 }, { "epoch": 0.69, "learning_rate": 1.1598811163515545e-06, "loss": 1.0748, "step": 22894 }, { "epoch": 0.69, "learning_rate": 1.1596752084046748e-06, "loss": 1.0406, "step": 22895 }, { "epoch": 0.69, "learning_rate": 1.1594693132170412e-06, "loss": 1.1666, "step": 22896 }, { "epoch": 0.69, "learning_rate": 1.1592634307906146e-06, "loss": 1.0816, "step": 22897 }, { "epoch": 0.69, "learning_rate": 1.159057561127354e-06, "loss": 1.2244, "step": 22898 }, { "epoch": 0.69, "learning_rate": 1.158851704229221e-06, "loss": 1.0737, "step": 22899 }, { "epoch": 0.69, "learning_rate": 1.1586458600981725e-06, "loss": 0.9539, "step": 22900 }, { "epoch": 0.69, "learning_rate": 1.1584400287361696e-06, "loss": 1.1066, "step": 22901 }, { "epoch": 0.69, "learning_rate": 1.1582342101451715e-06, "loss": 1.023, "step": 22902 }, { "epoch": 0.69, "learning_rate": 1.1580284043271386e-06, "loss": 1.1501, "step": 22903 }, { "epoch": 0.69, "learning_rate": 1.1578226112840279e-06, "loss": 1.161, "step": 22904 }, { "epoch": 0.69, "learning_rate": 1.1576168310177992e-06, "loss": 1.166, "step": 22905 }, { "epoch": 0.69, "learning_rate": 1.1574110635304122e-06, "loss": 1.2509, "step": 22906 }, { "epoch": 0.69, "learning_rate": 1.157205308823826e-06, "loss": 1.0634, "step": 22907 }, { "epoch": 0.69, "learning_rate": 1.1569995668999977e-06, "loss": 1.1476, "step": 22908 }, { "epoch": 0.69, "learning_rate": 1.1567938377608868e-06, "loss": 1.0925, "step": 22909 }, { "epoch": 0.69, "learning_rate": 1.1565881214084514e-06, "loss": 1.0896, "step": 22910 }, { "epoch": 0.69, "learning_rate": 1.1563824178446504e-06, "loss": 1.1472, "step": 22911 }, { "epoch": 0.69, "learning_rate": 1.1561767270714424e-06, "loss": 1.059, "step": 22912 }, { "epoch": 0.69, "learning_rate": 1.1559710490907839e-06, "loss": 1.1555, "step": 22913 }, { "epoch": 0.69, "learning_rate": 1.1557653839046334e-06, "loss": 1.1237, "step": 22914 }, { "epoch": 0.69, "learning_rate": 1.1555597315149494e-06, "loss": 1.1214, "step": 22915 }, { "epoch": 0.69, "learning_rate": 1.1553540919236892e-06, "loss": 1.0948, "step": 22916 }, { "epoch": 0.69, "learning_rate": 1.1551484651328102e-06, "loss": 1.0657, "step": 22917 }, { "epoch": 0.69, "learning_rate": 1.1549428511442703e-06, "loss": 1.0936, "step": 22918 }, { "epoch": 0.69, "learning_rate": 1.1547372499600268e-06, "loss": 1.1206, "step": 22919 }, { "epoch": 0.69, "learning_rate": 1.1545316615820373e-06, "loss": 1.1166, "step": 22920 }, { "epoch": 0.69, "learning_rate": 1.154326086012258e-06, "loss": 1.1169, "step": 22921 }, { "epoch": 0.69, "learning_rate": 1.1541205232526457e-06, "loss": 1.1953, "step": 22922 }, { "epoch": 0.69, "learning_rate": 1.153914973305158e-06, "loss": 1.2251, "step": 22923 }, { "epoch": 0.69, "learning_rate": 1.1537094361717516e-06, "loss": 1.0798, "step": 22924 }, { "epoch": 0.69, "learning_rate": 1.1535039118543839e-06, "loss": 1.1884, "step": 22925 }, { "epoch": 0.69, "learning_rate": 1.1532984003550092e-06, "loss": 1.0313, "step": 22926 }, { "epoch": 0.69, "learning_rate": 1.1530929016755856e-06, "loss": 1.1276, "step": 22927 }, { "epoch": 0.69, "learning_rate": 1.1528874158180689e-06, "loss": 1.1467, "step": 22928 }, { "epoch": 0.69, "learning_rate": 1.1526819427844157e-06, "loss": 1.2216, "step": 22929 }, { "epoch": 0.69, "learning_rate": 1.1524764825765808e-06, "loss": 1.0931, "step": 22930 }, { "epoch": 0.69, "learning_rate": 1.1522710351965208e-06, "loss": 1.1932, "step": 22931 }, { "epoch": 0.69, "learning_rate": 1.1520656006461916e-06, "loss": 1.1066, "step": 22932 }, { "epoch": 0.69, "learning_rate": 1.1518601789275495e-06, "loss": 1.1347, "step": 22933 }, { "epoch": 0.69, "learning_rate": 1.1516547700425481e-06, "loss": 1.196, "step": 22934 }, { "epoch": 0.69, "learning_rate": 1.1514493739931442e-06, "loss": 0.9997, "step": 22935 }, { "epoch": 0.69, "learning_rate": 1.1512439907812928e-06, "loss": 1.1879, "step": 22936 }, { "epoch": 0.69, "learning_rate": 1.1510386204089488e-06, "loss": 1.2079, "step": 22937 }, { "epoch": 0.69, "learning_rate": 1.1508332628780683e-06, "loss": 1.2489, "step": 22938 }, { "epoch": 0.69, "learning_rate": 1.1506279181906047e-06, "loss": 1.1155, "step": 22939 }, { "epoch": 0.69, "learning_rate": 1.1504225863485132e-06, "loss": 1.0795, "step": 22940 }, { "epoch": 0.69, "learning_rate": 1.150217267353749e-06, "loss": 1.1756, "step": 22941 }, { "epoch": 0.69, "learning_rate": 1.150011961208266e-06, "loss": 1.2043, "step": 22942 }, { "epoch": 0.69, "learning_rate": 1.149806667914019e-06, "loss": 1.0837, "step": 22943 }, { "epoch": 0.69, "learning_rate": 1.1496013874729625e-06, "loss": 1.1207, "step": 22944 }, { "epoch": 0.69, "learning_rate": 1.1493961198870503e-06, "loss": 1.0466, "step": 22945 }, { "epoch": 0.69, "learning_rate": 1.1491908651582376e-06, "loss": 1.1177, "step": 22946 }, { "epoch": 0.69, "learning_rate": 1.148985623288476e-06, "loss": 1.103, "step": 22947 }, { "epoch": 0.69, "learning_rate": 1.148780394279721e-06, "loss": 1.2353, "step": 22948 }, { "epoch": 0.69, "learning_rate": 1.1485751781339255e-06, "loss": 1.1874, "step": 22949 }, { "epoch": 0.69, "learning_rate": 1.148369974853044e-06, "loss": 1.1366, "step": 22950 }, { "epoch": 0.69, "learning_rate": 1.1481647844390297e-06, "loss": 0.9914, "step": 22951 }, { "epoch": 0.69, "learning_rate": 1.1479596068938348e-06, "loss": 1.081, "step": 22952 }, { "epoch": 0.69, "learning_rate": 1.1477544422194135e-06, "loss": 1.0642, "step": 22953 }, { "epoch": 0.69, "learning_rate": 1.1475492904177184e-06, "loss": 1.0871, "step": 22954 }, { "epoch": 0.69, "learning_rate": 1.1473441514907037e-06, "loss": 1.0704, "step": 22955 }, { "epoch": 0.69, "learning_rate": 1.1471390254403205e-06, "loss": 1.1575, "step": 22956 }, { "epoch": 0.69, "learning_rate": 1.146933912268522e-06, "loss": 1.1195, "step": 22957 }, { "epoch": 0.69, "learning_rate": 1.146728811977261e-06, "loss": 1.0294, "step": 22958 }, { "epoch": 0.69, "learning_rate": 1.146523724568491e-06, "loss": 1.0947, "step": 22959 }, { "epoch": 0.69, "learning_rate": 1.1463186500441622e-06, "loss": 1.1874, "step": 22960 }, { "epoch": 0.69, "learning_rate": 1.146113588406228e-06, "loss": 1.1481, "step": 22961 }, { "epoch": 0.69, "learning_rate": 1.1459085396566406e-06, "loss": 1.046, "step": 22962 }, { "epoch": 0.69, "learning_rate": 1.1457035037973513e-06, "loss": 1.2051, "step": 22963 }, { "epoch": 0.69, "learning_rate": 1.1454984808303134e-06, "loss": 1.0955, "step": 22964 }, { "epoch": 0.69, "learning_rate": 1.1452934707574769e-06, "loss": 1.0308, "step": 22965 }, { "epoch": 0.69, "learning_rate": 1.145088473580794e-06, "loss": 1.1433, "step": 22966 }, { "epoch": 0.69, "learning_rate": 1.1448834893022165e-06, "loss": 1.0662, "step": 22967 }, { "epoch": 0.69, "learning_rate": 1.1446785179236953e-06, "loss": 0.9879, "step": 22968 }, { "epoch": 0.69, "learning_rate": 1.1444735594471816e-06, "loss": 1.0497, "step": 22969 }, { "epoch": 0.69, "learning_rate": 1.1442686138746273e-06, "loss": 1.1567, "step": 22970 }, { "epoch": 0.69, "learning_rate": 1.1440636812079824e-06, "loss": 1.0672, "step": 22971 }, { "epoch": 0.69, "learning_rate": 1.1438587614491998e-06, "loss": 1.1052, "step": 22972 }, { "epoch": 0.69, "learning_rate": 1.143653854600227e-06, "loss": 1.0743, "step": 22973 }, { "epoch": 0.69, "learning_rate": 1.1434489606630166e-06, "loss": 1.1331, "step": 22974 }, { "epoch": 0.69, "learning_rate": 1.1432440796395188e-06, "loss": 1.1921, "step": 22975 }, { "epoch": 0.69, "learning_rate": 1.1430392115316838e-06, "loss": 1.1365, "step": 22976 }, { "epoch": 0.69, "learning_rate": 1.142834356341463e-06, "loss": 1.0661, "step": 22977 }, { "epoch": 0.69, "learning_rate": 1.1426295140708043e-06, "loss": 1.0911, "step": 22978 }, { "epoch": 0.69, "learning_rate": 1.1424246847216594e-06, "loss": 1.1481, "step": 22979 }, { "epoch": 0.69, "learning_rate": 1.1422198682959774e-06, "loss": 1.1467, "step": 22980 }, { "epoch": 0.69, "learning_rate": 1.142015064795709e-06, "loss": 1.2308, "step": 22981 }, { "epoch": 0.69, "learning_rate": 1.1418102742228027e-06, "loss": 1.034, "step": 22982 }, { "epoch": 0.69, "learning_rate": 1.1416054965792082e-06, "loss": 1.006, "step": 22983 }, { "epoch": 0.69, "learning_rate": 1.141400731866875e-06, "loss": 1.1009, "step": 22984 }, { "epoch": 0.69, "learning_rate": 1.1411959800877537e-06, "loss": 1.1344, "step": 22985 }, { "epoch": 0.69, "learning_rate": 1.1409912412437912e-06, "loss": 1.1, "step": 22986 }, { "epoch": 0.69, "learning_rate": 1.1407865153369375e-06, "loss": 1.1772, "step": 22987 }, { "epoch": 0.69, "learning_rate": 1.1405818023691418e-06, "loss": 1.1681, "step": 22988 }, { "epoch": 0.69, "learning_rate": 1.1403771023423532e-06, "loss": 1.177, "step": 22989 }, { "epoch": 0.69, "learning_rate": 1.1401724152585192e-06, "loss": 1.0966, "step": 22990 }, { "epoch": 0.69, "learning_rate": 1.1399677411195886e-06, "loss": 1.0953, "step": 22991 }, { "epoch": 0.69, "learning_rate": 1.1397630799275103e-06, "loss": 1.0842, "step": 22992 }, { "epoch": 0.69, "learning_rate": 1.1395584316842323e-06, "loss": 1.0497, "step": 22993 }, { "epoch": 0.69, "learning_rate": 1.1393537963917025e-06, "loss": 1.1013, "step": 22994 }, { "epoch": 0.69, "learning_rate": 1.1391491740518707e-06, "loss": 0.9703, "step": 22995 }, { "epoch": 0.69, "learning_rate": 1.1389445646666822e-06, "loss": 1.0293, "step": 22996 }, { "epoch": 0.69, "learning_rate": 1.1387399682380859e-06, "loss": 1.0226, "step": 22997 }, { "epoch": 0.69, "learning_rate": 1.1385353847680294e-06, "loss": 1.2046, "step": 22998 }, { "epoch": 0.69, "learning_rate": 1.1383308142584606e-06, "loss": 1.1976, "step": 22999 }, { "epoch": 0.69, "learning_rate": 1.1381262567113265e-06, "loss": 1.1415, "step": 23000 }, { "epoch": 0.69, "learning_rate": 1.1379217121285747e-06, "loss": 1.1353, "step": 23001 }, { "epoch": 0.69, "learning_rate": 1.137717180512153e-06, "loss": 1.155, "step": 23002 }, { "epoch": 0.69, "learning_rate": 1.1375126618640064e-06, "loss": 1.0698, "step": 23003 }, { "epoch": 0.69, "learning_rate": 1.1373081561860834e-06, "loss": 1.164, "step": 23004 }, { "epoch": 0.69, "learning_rate": 1.1371036634803307e-06, "loss": 1.0325, "step": 23005 }, { "epoch": 0.69, "learning_rate": 1.1368991837486943e-06, "loss": 0.8745, "step": 23006 }, { "epoch": 0.69, "learning_rate": 1.1366947169931222e-06, "loss": 1.0761, "step": 23007 }, { "epoch": 0.69, "learning_rate": 1.1364902632155589e-06, "loss": 1.0606, "step": 23008 }, { "epoch": 0.69, "learning_rate": 1.1362858224179515e-06, "loss": 1.1002, "step": 23009 }, { "epoch": 0.69, "learning_rate": 1.1360813946022466e-06, "loss": 1.1667, "step": 23010 }, { "epoch": 0.69, "learning_rate": 1.1358769797703905e-06, "loss": 1.1119, "step": 23011 }, { "epoch": 0.69, "learning_rate": 1.135672577924328e-06, "loss": 1.0714, "step": 23012 }, { "epoch": 0.69, "learning_rate": 1.1354681890660051e-06, "loss": 1.2311, "step": 23013 }, { "epoch": 0.69, "learning_rate": 1.135263813197368e-06, "loss": 1.1195, "step": 23014 }, { "epoch": 0.69, "learning_rate": 1.1350594503203633e-06, "loss": 1.0573, "step": 23015 }, { "epoch": 0.69, "learning_rate": 1.134855100436934e-06, "loss": 1.022, "step": 23016 }, { "epoch": 0.69, "learning_rate": 1.134650763549027e-06, "loss": 1.1255, "step": 23017 }, { "epoch": 0.69, "learning_rate": 1.1344464396585869e-06, "loss": 1.1968, "step": 23018 }, { "epoch": 0.69, "learning_rate": 1.134242128767559e-06, "loss": 1.1351, "step": 23019 }, { "epoch": 0.69, "learning_rate": 1.1340378308778894e-06, "loss": 1.0957, "step": 23020 }, { "epoch": 0.69, "learning_rate": 1.1338335459915205e-06, "loss": 1.0001, "step": 23021 }, { "epoch": 0.69, "learning_rate": 1.1336292741103986e-06, "loss": 1.0195, "step": 23022 }, { "epoch": 0.69, "learning_rate": 1.133425015236468e-06, "loss": 1.0854, "step": 23023 }, { "epoch": 0.69, "learning_rate": 1.1332207693716728e-06, "loss": 1.2017, "step": 23024 }, { "epoch": 0.69, "learning_rate": 1.1330165365179577e-06, "loss": 1.2117, "step": 23025 }, { "epoch": 0.69, "learning_rate": 1.132812316677267e-06, "loss": 1.1221, "step": 23026 }, { "epoch": 0.69, "learning_rate": 1.1326081098515443e-06, "loss": 1.0789, "step": 23027 }, { "epoch": 0.69, "learning_rate": 1.132403916042735e-06, "loss": 1.0762, "step": 23028 }, { "epoch": 0.69, "learning_rate": 1.1321997352527806e-06, "loss": 1.2052, "step": 23029 }, { "epoch": 0.69, "learning_rate": 1.1319955674836262e-06, "loss": 1.2523, "step": 23030 }, { "epoch": 0.69, "learning_rate": 1.131791412737215e-06, "loss": 1.1703, "step": 23031 }, { "epoch": 0.69, "learning_rate": 1.1315872710154907e-06, "loss": 1.139, "step": 23032 }, { "epoch": 0.69, "learning_rate": 1.1313831423203975e-06, "loss": 1.1622, "step": 23033 }, { "epoch": 0.69, "learning_rate": 1.1311790266538764e-06, "loss": 1.1841, "step": 23034 }, { "epoch": 0.69, "learning_rate": 1.130974924017872e-06, "loss": 1.1314, "step": 23035 }, { "epoch": 0.69, "learning_rate": 1.130770834414327e-06, "loss": 1.1492, "step": 23036 }, { "epoch": 0.69, "learning_rate": 1.1305667578451848e-06, "loss": 1.0465, "step": 23037 }, { "epoch": 0.69, "learning_rate": 1.1303626943123868e-06, "loss": 1.2209, "step": 23038 }, { "epoch": 0.69, "learning_rate": 1.1301586438178766e-06, "loss": 1.035, "step": 23039 }, { "epoch": 0.69, "learning_rate": 1.1299546063635962e-06, "loss": 1.1209, "step": 23040 }, { "epoch": 0.69, "learning_rate": 1.1297505819514886e-06, "loss": 1.0679, "step": 23041 }, { "epoch": 0.69, "learning_rate": 1.129546570583495e-06, "loss": 1.1448, "step": 23042 }, { "epoch": 0.69, "learning_rate": 1.129342572261558e-06, "loss": 1.1782, "step": 23043 }, { "epoch": 0.69, "learning_rate": 1.1291385869876198e-06, "loss": 0.9553, "step": 23044 }, { "epoch": 0.69, "learning_rate": 1.1289346147636215e-06, "loss": 1.0898, "step": 23045 }, { "epoch": 0.69, "learning_rate": 1.1287306555915068e-06, "loss": 1.1477, "step": 23046 }, { "epoch": 0.69, "learning_rate": 1.1285267094732143e-06, "loss": 1.0404, "step": 23047 }, { "epoch": 0.69, "learning_rate": 1.1283227764106876e-06, "loss": 1.1172, "step": 23048 }, { "epoch": 0.69, "learning_rate": 1.1281188564058673e-06, "loss": 1.0636, "step": 23049 }, { "epoch": 0.69, "learning_rate": 1.1279149494606944e-06, "loss": 1.254, "step": 23050 }, { "epoch": 0.69, "learning_rate": 1.1277110555771109e-06, "loss": 0.9812, "step": 23051 }, { "epoch": 0.69, "learning_rate": 1.1275071747570569e-06, "loss": 1.0583, "step": 23052 }, { "epoch": 0.69, "learning_rate": 1.1273033070024736e-06, "loss": 1.0503, "step": 23053 }, { "epoch": 0.69, "learning_rate": 1.1270994523153026e-06, "loss": 1.1813, "step": 23054 }, { "epoch": 0.69, "learning_rate": 1.1268956106974828e-06, "loss": 1.0862, "step": 23055 }, { "epoch": 0.69, "learning_rate": 1.1266917821509555e-06, "loss": 1.3093, "step": 23056 }, { "epoch": 0.69, "learning_rate": 1.126487966677661e-06, "loss": 1.0377, "step": 23057 }, { "epoch": 0.69, "learning_rate": 1.1262841642795394e-06, "loss": 1.0746, "step": 23058 }, { "epoch": 0.69, "learning_rate": 1.126080374958532e-06, "loss": 1.0325, "step": 23059 }, { "epoch": 0.69, "learning_rate": 1.1258765987165769e-06, "loss": 1.2069, "step": 23060 }, { "epoch": 0.69, "learning_rate": 1.1256728355556146e-06, "loss": 1.0402, "step": 23061 }, { "epoch": 0.69, "learning_rate": 1.125469085477585e-06, "loss": 1.2758, "step": 23062 }, { "epoch": 0.69, "learning_rate": 1.1252653484844287e-06, "loss": 1.1415, "step": 23063 }, { "epoch": 0.69, "learning_rate": 1.1250616245780832e-06, "loss": 1.0547, "step": 23064 }, { "epoch": 0.69, "learning_rate": 1.124857913760489e-06, "loss": 1.0571, "step": 23065 }, { "epoch": 0.69, "learning_rate": 1.124654216033585e-06, "loss": 1.1682, "step": 23066 }, { "epoch": 0.69, "learning_rate": 1.1244505313993115e-06, "loss": 1.117, "step": 23067 }, { "epoch": 0.69, "learning_rate": 1.1242468598596055e-06, "loss": 1.2853, "step": 23068 }, { "epoch": 0.69, "learning_rate": 1.1240432014164068e-06, "loss": 1.1484, "step": 23069 }, { "epoch": 0.69, "learning_rate": 1.1238395560716542e-06, "loss": 1.0284, "step": 23070 }, { "epoch": 0.7, "learning_rate": 1.1236359238272862e-06, "loss": 1.0204, "step": 23071 }, { "epoch": 0.7, "learning_rate": 1.1234323046852422e-06, "loss": 1.0153, "step": 23072 }, { "epoch": 0.7, "learning_rate": 1.1232286986474589e-06, "loss": 1.0853, "step": 23073 }, { "epoch": 0.7, "learning_rate": 1.123025105715875e-06, "loss": 1.1029, "step": 23074 }, { "epoch": 0.7, "learning_rate": 1.1228215258924294e-06, "loss": 1.1163, "step": 23075 }, { "epoch": 0.7, "learning_rate": 1.1226179591790593e-06, "loss": 1.0836, "step": 23076 }, { "epoch": 0.7, "learning_rate": 1.1224144055777037e-06, "loss": 1.1028, "step": 23077 }, { "epoch": 0.7, "learning_rate": 1.1222108650902987e-06, "loss": 1.0689, "step": 23078 }, { "epoch": 0.7, "learning_rate": 1.1220073377187827e-06, "loss": 1.0294, "step": 23079 }, { "epoch": 0.7, "learning_rate": 1.1218038234650933e-06, "loss": 1.101, "step": 23080 }, { "epoch": 0.7, "learning_rate": 1.1216003223311675e-06, "loss": 1.0278, "step": 23081 }, { "epoch": 0.7, "learning_rate": 1.1213968343189428e-06, "loss": 1.2098, "step": 23082 }, { "epoch": 0.7, "learning_rate": 1.1211933594303564e-06, "loss": 1.0721, "step": 23083 }, { "epoch": 0.7, "learning_rate": 1.120989897667345e-06, "loss": 1.0491, "step": 23084 }, { "epoch": 0.7, "learning_rate": 1.1207864490318467e-06, "loss": 1.0632, "step": 23085 }, { "epoch": 0.7, "learning_rate": 1.1205830135257961e-06, "loss": 1.2452, "step": 23086 }, { "epoch": 0.7, "learning_rate": 1.120379591151131e-06, "loss": 1.0984, "step": 23087 }, { "epoch": 0.7, "learning_rate": 1.120176181909788e-06, "loss": 1.0287, "step": 23088 }, { "epoch": 0.7, "learning_rate": 1.1199727858037035e-06, "loss": 1.0284, "step": 23089 }, { "epoch": 0.7, "learning_rate": 1.119769402834813e-06, "loss": 0.9761, "step": 23090 }, { "epoch": 0.7, "learning_rate": 1.119566033005053e-06, "loss": 1.0588, "step": 23091 }, { "epoch": 0.7, "learning_rate": 1.1193626763163593e-06, "loss": 1.088, "step": 23092 }, { "epoch": 0.7, "learning_rate": 1.119159332770669e-06, "loss": 1.1542, "step": 23093 }, { "epoch": 0.7, "learning_rate": 1.1189560023699159e-06, "loss": 1.1822, "step": 23094 }, { "epoch": 0.7, "learning_rate": 1.1187526851160365e-06, "loss": 0.9824, "step": 23095 }, { "epoch": 0.7, "learning_rate": 1.1185493810109664e-06, "loss": 1.1064, "step": 23096 }, { "epoch": 0.7, "learning_rate": 1.1183460900566407e-06, "loss": 1.0474, "step": 23097 }, { "epoch": 0.7, "learning_rate": 1.118142812254996e-06, "loss": 1.1362, "step": 23098 }, { "epoch": 0.7, "learning_rate": 1.117939547607965e-06, "loss": 1.1454, "step": 23099 }, { "epoch": 0.7, "learning_rate": 1.117736296117484e-06, "loss": 1.1829, "step": 23100 }, { "epoch": 0.7, "learning_rate": 1.1175330577854876e-06, "loss": 1.061, "step": 23101 }, { "epoch": 0.7, "learning_rate": 1.1173298326139118e-06, "loss": 1.0728, "step": 23102 }, { "epoch": 0.7, "learning_rate": 1.117126620604689e-06, "loss": 1.0634, "step": 23103 }, { "epoch": 0.7, "learning_rate": 1.1169234217597549e-06, "loss": 1.072, "step": 23104 }, { "epoch": 0.7, "learning_rate": 1.1167202360810437e-06, "loss": 1.1802, "step": 23105 }, { "epoch": 0.7, "learning_rate": 1.1165170635704894e-06, "loss": 1.0425, "step": 23106 }, { "epoch": 0.7, "learning_rate": 1.1163139042300267e-06, "loss": 0.9874, "step": 23107 }, { "epoch": 0.7, "learning_rate": 1.1161107580615887e-06, "loss": 1.0184, "step": 23108 }, { "epoch": 0.7, "learning_rate": 1.1159076250671102e-06, "loss": 1.0765, "step": 23109 }, { "epoch": 0.7, "learning_rate": 1.1157045052485247e-06, "loss": 1.1082, "step": 23110 }, { "epoch": 0.7, "learning_rate": 1.1155013986077662e-06, "loss": 1.085, "step": 23111 }, { "epoch": 0.7, "learning_rate": 1.1152983051467667e-06, "loss": 1.1938, "step": 23112 }, { "epoch": 0.7, "learning_rate": 1.1150952248674604e-06, "loss": 1.1004, "step": 23113 }, { "epoch": 0.7, "learning_rate": 1.1148921577717806e-06, "loss": 1.1223, "step": 23114 }, { "epoch": 0.7, "learning_rate": 1.1146891038616615e-06, "loss": 1.0513, "step": 23115 }, { "epoch": 0.7, "learning_rate": 1.1144860631390337e-06, "loss": 1.0989, "step": 23116 }, { "epoch": 0.7, "learning_rate": 1.1142830356058315e-06, "loss": 1.0717, "step": 23117 }, { "epoch": 0.7, "learning_rate": 1.1140800212639875e-06, "loss": 1.0792, "step": 23118 }, { "epoch": 0.7, "learning_rate": 1.1138770201154348e-06, "loss": 1.2072, "step": 23119 }, { "epoch": 0.7, "learning_rate": 1.1136740321621046e-06, "loss": 1.0024, "step": 23120 }, { "epoch": 0.7, "learning_rate": 1.11347105740593e-06, "loss": 1.1379, "step": 23121 }, { "epoch": 0.7, "learning_rate": 1.1132680958488428e-06, "loss": 1.0991, "step": 23122 }, { "epoch": 0.7, "learning_rate": 1.113065147492776e-06, "loss": 1.127, "step": 23123 }, { "epoch": 0.7, "learning_rate": 1.1128622123396616e-06, "loss": 1.0203, "step": 23124 }, { "epoch": 0.7, "learning_rate": 1.1126592903914299e-06, "loss": 1.0831, "step": 23125 }, { "epoch": 0.7, "learning_rate": 1.1124563816500137e-06, "loss": 1.1544, "step": 23126 }, { "epoch": 0.7, "learning_rate": 1.1122534861173445e-06, "loss": 1.0595, "step": 23127 }, { "epoch": 0.7, "learning_rate": 1.1120506037953546e-06, "loss": 1.151, "step": 23128 }, { "epoch": 0.7, "learning_rate": 1.1118477346859737e-06, "loss": 1.0624, "step": 23129 }, { "epoch": 0.7, "learning_rate": 1.1116448787911339e-06, "loss": 1.1458, "step": 23130 }, { "epoch": 0.7, "learning_rate": 1.111442036112766e-06, "loss": 1.0674, "step": 23131 }, { "epoch": 0.7, "learning_rate": 1.111239206652801e-06, "loss": 1.0565, "step": 23132 }, { "epoch": 0.7, "learning_rate": 1.11103639041317e-06, "loss": 1.0894, "step": 23133 }, { "epoch": 0.7, "learning_rate": 1.110833587395804e-06, "loss": 0.9564, "step": 23134 }, { "epoch": 0.7, "learning_rate": 1.1106307976026328e-06, "loss": 1.0522, "step": 23135 }, { "epoch": 0.7, "learning_rate": 1.1104280210355871e-06, "loss": 1.2006, "step": 23136 }, { "epoch": 0.7, "learning_rate": 1.1102252576965988e-06, "loss": 1.0871, "step": 23137 }, { "epoch": 0.7, "learning_rate": 1.1100225075875956e-06, "loss": 1.1307, "step": 23138 }, { "epoch": 0.7, "learning_rate": 1.1098197707105087e-06, "loss": 1.1278, "step": 23139 }, { "epoch": 0.7, "learning_rate": 1.109617047067268e-06, "loss": 0.9947, "step": 23140 }, { "epoch": 0.7, "learning_rate": 1.1094143366598042e-06, "loss": 1.0858, "step": 23141 }, { "epoch": 0.7, "learning_rate": 1.1092116394900457e-06, "loss": 1.1146, "step": 23142 }, { "epoch": 0.7, "learning_rate": 1.109008955559922e-06, "loss": 1.1772, "step": 23143 }, { "epoch": 0.7, "learning_rate": 1.1088062848713636e-06, "loss": 1.0555, "step": 23144 }, { "epoch": 0.7, "learning_rate": 1.1086036274262998e-06, "loss": 1.1117, "step": 23145 }, { "epoch": 0.7, "learning_rate": 1.1084009832266587e-06, "loss": 1.0289, "step": 23146 }, { "epoch": 0.7, "learning_rate": 1.10819835227437e-06, "loss": 1.1471, "step": 23147 }, { "epoch": 0.7, "learning_rate": 1.1079957345713627e-06, "loss": 1.0048, "step": 23148 }, { "epoch": 0.7, "learning_rate": 1.1077931301195658e-06, "loss": 1.1194, "step": 23149 }, { "epoch": 0.7, "learning_rate": 1.1075905389209082e-06, "loss": 1.1056, "step": 23150 }, { "epoch": 0.7, "learning_rate": 1.1073879609773175e-06, "loss": 1.1258, "step": 23151 }, { "epoch": 0.7, "learning_rate": 1.1071853962907226e-06, "loss": 1.1428, "step": 23152 }, { "epoch": 0.7, "learning_rate": 1.106982844863052e-06, "loss": 1.0398, "step": 23153 }, { "epoch": 0.7, "learning_rate": 1.1067803066962347e-06, "loss": 1.022, "step": 23154 }, { "epoch": 0.7, "learning_rate": 1.106577781792197e-06, "loss": 1.1111, "step": 23155 }, { "epoch": 0.7, "learning_rate": 1.1063752701528676e-06, "loss": 1.05, "step": 23156 }, { "epoch": 0.7, "learning_rate": 1.1061727717801746e-06, "loss": 1.0698, "step": 23157 }, { "epoch": 0.7, "learning_rate": 1.1059702866760452e-06, "loss": 1.0977, "step": 23158 }, { "epoch": 0.7, "learning_rate": 1.1057678148424086e-06, "loss": 1.069, "step": 23159 }, { "epoch": 0.7, "learning_rate": 1.1055653562811897e-06, "loss": 0.9819, "step": 23160 }, { "epoch": 0.7, "learning_rate": 1.1053629109943173e-06, "loss": 1.1203, "step": 23161 }, { "epoch": 0.7, "learning_rate": 1.105160478983718e-06, "loss": 1.0517, "step": 23162 }, { "epoch": 0.7, "learning_rate": 1.1049580602513192e-06, "loss": 1.0976, "step": 23163 }, { "epoch": 0.7, "learning_rate": 1.1047556547990482e-06, "loss": 1.085, "step": 23164 }, { "epoch": 0.7, "learning_rate": 1.104553262628831e-06, "loss": 1.0063, "step": 23165 }, { "epoch": 0.7, "learning_rate": 1.1043508837425948e-06, "loss": 1.0366, "step": 23166 }, { "epoch": 0.7, "learning_rate": 1.104148518142267e-06, "loss": 0.9575, "step": 23167 }, { "epoch": 0.7, "learning_rate": 1.103946165829772e-06, "loss": 1.2103, "step": 23168 }, { "epoch": 0.7, "learning_rate": 1.1037438268070372e-06, "loss": 1.1337, "step": 23169 }, { "epoch": 0.7, "learning_rate": 1.1035415010759886e-06, "loss": 1.1536, "step": 23170 }, { "epoch": 0.7, "learning_rate": 1.1033391886385533e-06, "loss": 1.0427, "step": 23171 }, { "epoch": 0.7, "learning_rate": 1.1031368894966554e-06, "loss": 1.0988, "step": 23172 }, { "epoch": 0.7, "learning_rate": 1.1029346036522214e-06, "loss": 1.0406, "step": 23173 }, { "epoch": 0.7, "learning_rate": 1.1027323311071775e-06, "loss": 1.1959, "step": 23174 }, { "epoch": 0.7, "learning_rate": 1.1025300718634497e-06, "loss": 1.1653, "step": 23175 }, { "epoch": 0.7, "learning_rate": 1.1023278259229615e-06, "loss": 1.1497, "step": 23176 }, { "epoch": 0.7, "learning_rate": 1.1021255932876392e-06, "loss": 1.1265, "step": 23177 }, { "epoch": 0.7, "learning_rate": 1.1019233739594081e-06, "loss": 1.0702, "step": 23178 }, { "epoch": 0.7, "learning_rate": 1.1017211679401932e-06, "loss": 1.061, "step": 23179 }, { "epoch": 0.7, "learning_rate": 1.10151897523192e-06, "loss": 1.1485, "step": 23180 }, { "epoch": 0.7, "learning_rate": 1.101316795836512e-06, "loss": 1.1893, "step": 23181 }, { "epoch": 0.7, "learning_rate": 1.1011146297558945e-06, "loss": 1.0677, "step": 23182 }, { "epoch": 0.7, "learning_rate": 1.100912476991992e-06, "loss": 1.1249, "step": 23183 }, { "epoch": 0.7, "learning_rate": 1.1007103375467293e-06, "loss": 1.0903, "step": 23184 }, { "epoch": 0.7, "learning_rate": 1.1005082114220296e-06, "loss": 1.052, "step": 23185 }, { "epoch": 0.7, "learning_rate": 1.100306098619818e-06, "loss": 1.1368, "step": 23186 }, { "epoch": 0.7, "learning_rate": 1.100103999142018e-06, "loss": 1.2662, "step": 23187 }, { "epoch": 0.7, "learning_rate": 1.0999019129905538e-06, "loss": 1.132, "step": 23188 }, { "epoch": 0.7, "learning_rate": 1.0996998401673492e-06, "loss": 1.0578, "step": 23189 }, { "epoch": 0.7, "learning_rate": 1.0994977806743276e-06, "loss": 1.0809, "step": 23190 }, { "epoch": 0.7, "learning_rate": 1.0992957345134125e-06, "loss": 1.1045, "step": 23191 }, { "epoch": 0.7, "learning_rate": 1.0990937016865275e-06, "loss": 1.0834, "step": 23192 }, { "epoch": 0.7, "learning_rate": 1.0988916821955967e-06, "loss": 1.1629, "step": 23193 }, { "epoch": 0.7, "learning_rate": 1.0986896760425414e-06, "loss": 1.2087, "step": 23194 }, { "epoch": 0.7, "learning_rate": 1.0984876832292853e-06, "loss": 1.0912, "step": 23195 }, { "epoch": 0.7, "learning_rate": 1.098285703757752e-06, "loss": 1.1219, "step": 23196 }, { "epoch": 0.7, "learning_rate": 1.098083737629864e-06, "loss": 1.1106, "step": 23197 }, { "epoch": 0.7, "learning_rate": 1.097881784847543e-06, "loss": 1.1434, "step": 23198 }, { "epoch": 0.7, "learning_rate": 1.097679845412712e-06, "loss": 1.1579, "step": 23199 }, { "epoch": 0.7, "learning_rate": 1.0974779193272937e-06, "loss": 1.2173, "step": 23200 }, { "epoch": 0.7, "learning_rate": 1.097276006593211e-06, "loss": 1.1439, "step": 23201 }, { "epoch": 0.7, "learning_rate": 1.0970741072123838e-06, "loss": 1.0787, "step": 23202 }, { "epoch": 0.7, "learning_rate": 1.0968722211867358e-06, "loss": 1.1813, "step": 23203 }, { "epoch": 0.7, "learning_rate": 1.0966703485181887e-06, "loss": 1.0087, "step": 23204 }, { "epoch": 0.7, "learning_rate": 1.0964684892086635e-06, "loss": 1.1247, "step": 23205 }, { "epoch": 0.7, "learning_rate": 1.0962666432600836e-06, "loss": 1.1813, "step": 23206 }, { "epoch": 0.7, "learning_rate": 1.0960648106743683e-06, "loss": 1.1237, "step": 23207 }, { "epoch": 0.7, "learning_rate": 1.0958629914534397e-06, "loss": 1.1188, "step": 23208 }, { "epoch": 0.7, "learning_rate": 1.0956611855992191e-06, "loss": 1.1592, "step": 23209 }, { "epoch": 0.7, "learning_rate": 1.0954593931136287e-06, "loss": 1.0851, "step": 23210 }, { "epoch": 0.7, "learning_rate": 1.0952576139985875e-06, "loss": 1.0436, "step": 23211 }, { "epoch": 0.7, "learning_rate": 1.0950558482560172e-06, "loss": 1.1816, "step": 23212 }, { "epoch": 0.7, "learning_rate": 1.0948540958878387e-06, "loss": 1.221, "step": 23213 }, { "epoch": 0.7, "learning_rate": 1.0946523568959724e-06, "loss": 1.0831, "step": 23214 }, { "epoch": 0.7, "learning_rate": 1.0944506312823388e-06, "loss": 1.1783, "step": 23215 }, { "epoch": 0.7, "learning_rate": 1.0942489190488583e-06, "loss": 1.161, "step": 23216 }, { "epoch": 0.7, "learning_rate": 1.0940472201974508e-06, "loss": 1.145, "step": 23217 }, { "epoch": 0.7, "learning_rate": 1.093845534730037e-06, "loss": 1.056, "step": 23218 }, { "epoch": 0.7, "learning_rate": 1.0936438626485374e-06, "loss": 1.1945, "step": 23219 }, { "epoch": 0.7, "learning_rate": 1.0934422039548699e-06, "loss": 1.0659, "step": 23220 }, { "epoch": 0.7, "learning_rate": 1.0932405586509551e-06, "loss": 1.063, "step": 23221 }, { "epoch": 0.7, "learning_rate": 1.0930389267387126e-06, "loss": 0.9824, "step": 23222 }, { "epoch": 0.7, "learning_rate": 1.092837308220063e-06, "loss": 1.1447, "step": 23223 }, { "epoch": 0.7, "learning_rate": 1.0926357030969234e-06, "loss": 1.1447, "step": 23224 }, { "epoch": 0.7, "learning_rate": 1.0924341113712142e-06, "loss": 1.2352, "step": 23225 }, { "epoch": 0.7, "learning_rate": 1.0922325330448545e-06, "loss": 1.139, "step": 23226 }, { "epoch": 0.7, "learning_rate": 1.0920309681197639e-06, "loss": 1.1517, "step": 23227 }, { "epoch": 0.7, "learning_rate": 1.0918294165978594e-06, "loss": 0.9886, "step": 23228 }, { "epoch": 0.7, "learning_rate": 1.0916278784810607e-06, "loss": 1.0562, "step": 23229 }, { "epoch": 0.7, "learning_rate": 1.0914263537712862e-06, "loss": 1.1584, "step": 23230 }, { "epoch": 0.7, "learning_rate": 1.0912248424704543e-06, "loss": 1.0961, "step": 23231 }, { "epoch": 0.7, "learning_rate": 1.0910233445804846e-06, "loss": 1.075, "step": 23232 }, { "epoch": 0.7, "learning_rate": 1.0908218601032932e-06, "loss": 1.149, "step": 23233 }, { "epoch": 0.7, "learning_rate": 1.090620389040799e-06, "loss": 1.1226, "step": 23234 }, { "epoch": 0.7, "learning_rate": 1.09041893139492e-06, "loss": 1.1697, "step": 23235 }, { "epoch": 0.7, "learning_rate": 1.0902174871675744e-06, "loss": 1.0967, "step": 23236 }, { "epoch": 0.7, "learning_rate": 1.0900160563606786e-06, "loss": 1.1583, "step": 23237 }, { "epoch": 0.7, "learning_rate": 1.0898146389761511e-06, "loss": 1.1682, "step": 23238 }, { "epoch": 0.7, "learning_rate": 1.089613235015909e-06, "loss": 1.0896, "step": 23239 }, { "epoch": 0.7, "learning_rate": 1.0894118444818693e-06, "loss": 1.0851, "step": 23240 }, { "epoch": 0.7, "learning_rate": 1.08921046737595e-06, "loss": 1.1207, "step": 23241 }, { "epoch": 0.7, "learning_rate": 1.089009103700068e-06, "loss": 1.0463, "step": 23242 }, { "epoch": 0.7, "learning_rate": 1.0888077534561392e-06, "loss": 1.1697, "step": 23243 }, { "epoch": 0.7, "learning_rate": 1.0886064166460808e-06, "loss": 1.1617, "step": 23244 }, { "epoch": 0.7, "learning_rate": 1.0884050932718097e-06, "loss": 1.1864, "step": 23245 }, { "epoch": 0.7, "learning_rate": 1.0882037833352417e-06, "loss": 0.985, "step": 23246 }, { "epoch": 0.7, "learning_rate": 1.0880024868382944e-06, "loss": 1.0269, "step": 23247 }, { "epoch": 0.7, "learning_rate": 1.0878012037828831e-06, "loss": 1.175, "step": 23248 }, { "epoch": 0.7, "learning_rate": 1.0875999341709253e-06, "loss": 1.2622, "step": 23249 }, { "epoch": 0.7, "learning_rate": 1.087398678004335e-06, "loss": 1.092, "step": 23250 }, { "epoch": 0.7, "learning_rate": 1.0871974352850288e-06, "loss": 1.0773, "step": 23251 }, { "epoch": 0.7, "learning_rate": 1.0869962060149225e-06, "loss": 1.2125, "step": 23252 }, { "epoch": 0.7, "learning_rate": 1.0867949901959326e-06, "loss": 1.1725, "step": 23253 }, { "epoch": 0.7, "learning_rate": 1.0865937878299732e-06, "loss": 1.2433, "step": 23254 }, { "epoch": 0.7, "learning_rate": 1.0863925989189602e-06, "loss": 1.0915, "step": 23255 }, { "epoch": 0.7, "learning_rate": 1.0861914234648085e-06, "loss": 1.051, "step": 23256 }, { "epoch": 0.7, "learning_rate": 1.085990261469434e-06, "loss": 1.0469, "step": 23257 }, { "epoch": 0.7, "learning_rate": 1.0857891129347516e-06, "loss": 1.093, "step": 23258 }, { "epoch": 0.7, "learning_rate": 1.0855879778626753e-06, "loss": 1.1578, "step": 23259 }, { "epoch": 0.7, "learning_rate": 1.0853868562551202e-06, "loss": 1.1022, "step": 23260 }, { "epoch": 0.7, "learning_rate": 1.0851857481140007e-06, "loss": 1.0418, "step": 23261 }, { "epoch": 0.7, "learning_rate": 1.0849846534412323e-06, "loss": 1.0846, "step": 23262 }, { "epoch": 0.7, "learning_rate": 1.0847835722387279e-06, "loss": 1.0436, "step": 23263 }, { "epoch": 0.7, "learning_rate": 1.0845825045084021e-06, "loss": 1.0697, "step": 23264 }, { "epoch": 0.7, "learning_rate": 1.0843814502521693e-06, "loss": 1.1638, "step": 23265 }, { "epoch": 0.7, "learning_rate": 1.084180409471944e-06, "loss": 1.1063, "step": 23266 }, { "epoch": 0.7, "learning_rate": 1.0839793821696388e-06, "loss": 1.1982, "step": 23267 }, { "epoch": 0.7, "learning_rate": 1.0837783683471675e-06, "loss": 1.1529, "step": 23268 }, { "epoch": 0.7, "learning_rate": 1.0835773680064444e-06, "loss": 1.075, "step": 23269 }, { "epoch": 0.7, "learning_rate": 1.0833763811493822e-06, "loss": 0.9865, "step": 23270 }, { "epoch": 0.7, "learning_rate": 1.0831754077778946e-06, "loss": 1.0597, "step": 23271 }, { "epoch": 0.7, "learning_rate": 1.082974447893895e-06, "loss": 0.9672, "step": 23272 }, { "epoch": 0.7, "learning_rate": 1.0827735014992962e-06, "loss": 1.144, "step": 23273 }, { "epoch": 0.7, "learning_rate": 1.0825725685960112e-06, "loss": 1.1439, "step": 23274 }, { "epoch": 0.7, "learning_rate": 1.0823716491859533e-06, "loss": 1.1697, "step": 23275 }, { "epoch": 0.7, "learning_rate": 1.0821707432710339e-06, "loss": 1.1501, "step": 23276 }, { "epoch": 0.7, "learning_rate": 1.081969850853166e-06, "loss": 1.0356, "step": 23277 }, { "epoch": 0.7, "learning_rate": 1.0817689719342623e-06, "loss": 1.1794, "step": 23278 }, { "epoch": 0.7, "learning_rate": 1.0815681065162355e-06, "loss": 1.1574, "step": 23279 }, { "epoch": 0.7, "learning_rate": 1.0813672546009967e-06, "loss": 1.1833, "step": 23280 }, { "epoch": 0.7, "learning_rate": 1.0811664161904584e-06, "loss": 1.0623, "step": 23281 }, { "epoch": 0.7, "learning_rate": 1.080965591286532e-06, "loss": 1.122, "step": 23282 }, { "epoch": 0.7, "learning_rate": 1.0807647798911302e-06, "loss": 1.121, "step": 23283 }, { "epoch": 0.7, "learning_rate": 1.080563982006165e-06, "loss": 1.1375, "step": 23284 }, { "epoch": 0.7, "learning_rate": 1.080363197633546e-06, "loss": 1.0851, "step": 23285 }, { "epoch": 0.7, "learning_rate": 1.0801624267751858e-06, "loss": 1.1438, "step": 23286 }, { "epoch": 0.7, "learning_rate": 1.0799616694329954e-06, "loss": 0.9787, "step": 23287 }, { "epoch": 0.7, "learning_rate": 1.079760925608887e-06, "loss": 1.1509, "step": 23288 }, { "epoch": 0.7, "learning_rate": 1.0795601953047696e-06, "loss": 1.074, "step": 23289 }, { "epoch": 0.7, "learning_rate": 1.079359478522555e-06, "loss": 1.0218, "step": 23290 }, { "epoch": 0.7, "learning_rate": 1.079158775264154e-06, "loss": 1.1589, "step": 23291 }, { "epoch": 0.7, "learning_rate": 1.0789580855314779e-06, "loss": 1.1074, "step": 23292 }, { "epoch": 0.7, "learning_rate": 1.0787574093264358e-06, "loss": 1.1411, "step": 23293 }, { "epoch": 0.7, "learning_rate": 1.0785567466509386e-06, "loss": 1.0684, "step": 23294 }, { "epoch": 0.7, "learning_rate": 1.0783560975068965e-06, "loss": 1.1047, "step": 23295 }, { "epoch": 0.7, "learning_rate": 1.0781554618962197e-06, "loss": 1.0259, "step": 23296 }, { "epoch": 0.7, "learning_rate": 1.0779548398208182e-06, "loss": 1.035, "step": 23297 }, { "epoch": 0.7, "learning_rate": 1.0777542312826017e-06, "loss": 1.0641, "step": 23298 }, { "epoch": 0.7, "learning_rate": 1.07755363628348e-06, "loss": 1.163, "step": 23299 }, { "epoch": 0.7, "learning_rate": 1.0773530548253623e-06, "loss": 1.1041, "step": 23300 }, { "epoch": 0.7, "learning_rate": 1.0771524869101594e-06, "loss": 0.9713, "step": 23301 }, { "epoch": 0.7, "learning_rate": 1.0769519325397787e-06, "loss": 1.0789, "step": 23302 }, { "epoch": 0.7, "learning_rate": 1.0767513917161303e-06, "loss": 1.1328, "step": 23303 }, { "epoch": 0.7, "learning_rate": 1.0765508644411232e-06, "loss": 1.0689, "step": 23304 }, { "epoch": 0.7, "learning_rate": 1.076350350716667e-06, "loss": 1.1428, "step": 23305 }, { "epoch": 0.7, "learning_rate": 1.076149850544669e-06, "loss": 1.1218, "step": 23306 }, { "epoch": 0.7, "learning_rate": 1.0759493639270388e-06, "loss": 1.0497, "step": 23307 }, { "epoch": 0.7, "learning_rate": 1.0757488908656849e-06, "loss": 1.1609, "step": 23308 }, { "epoch": 0.7, "learning_rate": 1.0755484313625152e-06, "loss": 1.1219, "step": 23309 }, { "epoch": 0.7, "learning_rate": 1.07534798541944e-06, "loss": 1.1343, "step": 23310 }, { "epoch": 0.7, "learning_rate": 1.0751475530383644e-06, "loss": 1.1818, "step": 23311 }, { "epoch": 0.7, "learning_rate": 1.0749471342211977e-06, "loss": 1.1133, "step": 23312 }, { "epoch": 0.7, "learning_rate": 1.0747467289698484e-06, "loss": 0.9638, "step": 23313 }, { "epoch": 0.7, "learning_rate": 1.0745463372862244e-06, "loss": 1.1371, "step": 23314 }, { "epoch": 0.7, "learning_rate": 1.074345959172232e-06, "loss": 1.1194, "step": 23315 }, { "epoch": 0.7, "learning_rate": 1.0741455946297796e-06, "loss": 1.1097, "step": 23316 }, { "epoch": 0.7, "learning_rate": 1.0739452436607741e-06, "loss": 1.0234, "step": 23317 }, { "epoch": 0.7, "learning_rate": 1.0737449062671244e-06, "loss": 1.1505, "step": 23318 }, { "epoch": 0.7, "learning_rate": 1.073544582450735e-06, "loss": 1.079, "step": 23319 }, { "epoch": 0.7, "learning_rate": 1.0733442722135144e-06, "loss": 1.0415, "step": 23320 }, { "epoch": 0.7, "learning_rate": 1.073143975557369e-06, "loss": 1.0857, "step": 23321 }, { "epoch": 0.7, "learning_rate": 1.0729436924842058e-06, "loss": 1.0425, "step": 23322 }, { "epoch": 0.7, "learning_rate": 1.0727434229959313e-06, "loss": 1.1305, "step": 23323 }, { "epoch": 0.7, "learning_rate": 1.072543167094453e-06, "loss": 1.2446, "step": 23324 }, { "epoch": 0.7, "learning_rate": 1.0723429247816754e-06, "loss": 1.0834, "step": 23325 }, { "epoch": 0.7, "learning_rate": 1.0721426960595057e-06, "loss": 1.085, "step": 23326 }, { "epoch": 0.7, "learning_rate": 1.0719424809298495e-06, "loss": 1.0314, "step": 23327 }, { "epoch": 0.7, "learning_rate": 1.0717422793946136e-06, "loss": 1.0579, "step": 23328 }, { "epoch": 0.7, "learning_rate": 1.0715420914557028e-06, "loss": 1.0589, "step": 23329 }, { "epoch": 0.7, "learning_rate": 1.0713419171150238e-06, "loss": 1.142, "step": 23330 }, { "epoch": 0.7, "learning_rate": 1.0711417563744822e-06, "loss": 1.0801, "step": 23331 }, { "epoch": 0.7, "learning_rate": 1.0709416092359824e-06, "loss": 1.1315, "step": 23332 }, { "epoch": 0.7, "learning_rate": 1.0707414757014299e-06, "loss": 1.1127, "step": 23333 }, { "epoch": 0.7, "learning_rate": 1.0705413557727303e-06, "loss": 1.0547, "step": 23334 }, { "epoch": 0.7, "learning_rate": 1.0703412494517885e-06, "loss": 1.1158, "step": 23335 }, { "epoch": 0.7, "learning_rate": 1.0701411567405104e-06, "loss": 1.182, "step": 23336 }, { "epoch": 0.7, "learning_rate": 1.069941077640799e-06, "loss": 1.2079, "step": 23337 }, { "epoch": 0.7, "learning_rate": 1.0697410121545596e-06, "loss": 0.9655, "step": 23338 }, { "epoch": 0.7, "learning_rate": 1.069540960283697e-06, "loss": 1.1065, "step": 23339 }, { "epoch": 0.7, "learning_rate": 1.0693409220301168e-06, "loss": 1.1406, "step": 23340 }, { "epoch": 0.7, "learning_rate": 1.0691408973957207e-06, "loss": 1.1609, "step": 23341 }, { "epoch": 0.7, "learning_rate": 1.0689408863824141e-06, "loss": 1.0563, "step": 23342 }, { "epoch": 0.7, "learning_rate": 1.068740888992101e-06, "loss": 1.2198, "step": 23343 }, { "epoch": 0.7, "learning_rate": 1.0685409052266866e-06, "loss": 1.1319, "step": 23344 }, { "epoch": 0.7, "learning_rate": 1.068340935088072e-06, "loss": 1.0779, "step": 23345 }, { "epoch": 0.7, "learning_rate": 1.0681409785781626e-06, "loss": 1.0462, "step": 23346 }, { "epoch": 0.7, "learning_rate": 1.0679410356988615e-06, "loss": 1.0656, "step": 23347 }, { "epoch": 0.7, "learning_rate": 1.0677411064520719e-06, "loss": 1.1127, "step": 23348 }, { "epoch": 0.7, "learning_rate": 1.067541190839698e-06, "loss": 1.0733, "step": 23349 }, { "epoch": 0.7, "learning_rate": 1.0673412888636411e-06, "loss": 1.1926, "step": 23350 }, { "epoch": 0.7, "learning_rate": 1.0671414005258052e-06, "loss": 1.1609, "step": 23351 }, { "epoch": 0.7, "learning_rate": 1.066941525828093e-06, "loss": 1.1594, "step": 23352 }, { "epoch": 0.7, "learning_rate": 1.0667416647724075e-06, "loss": 1.0285, "step": 23353 }, { "epoch": 0.7, "learning_rate": 1.066541817360651e-06, "loss": 1.1921, "step": 23354 }, { "epoch": 0.7, "learning_rate": 1.0663419835947258e-06, "loss": 1.1053, "step": 23355 }, { "epoch": 0.7, "learning_rate": 1.0661421634765348e-06, "loss": 1.3097, "step": 23356 }, { "epoch": 0.7, "learning_rate": 1.0659423570079806e-06, "loss": 1.2325, "step": 23357 }, { "epoch": 0.7, "learning_rate": 1.0657425641909636e-06, "loss": 1.0502, "step": 23358 }, { "epoch": 0.7, "learning_rate": 1.0655427850273864e-06, "loss": 1.0055, "step": 23359 }, { "epoch": 0.7, "learning_rate": 1.065343019519151e-06, "loss": 1.1514, "step": 23360 }, { "epoch": 0.7, "learning_rate": 1.0651432676681605e-06, "loss": 1.0567, "step": 23361 }, { "epoch": 0.7, "learning_rate": 1.064943529476314e-06, "loss": 1.1303, "step": 23362 }, { "epoch": 0.7, "learning_rate": 1.0647438049455137e-06, "loss": 1.1095, "step": 23363 }, { "epoch": 0.7, "learning_rate": 1.064544094077661e-06, "loss": 1.0092, "step": 23364 }, { "epoch": 0.7, "learning_rate": 1.0643443968746575e-06, "loss": 1.1025, "step": 23365 }, { "epoch": 0.7, "learning_rate": 1.0641447133384047e-06, "loss": 1.1228, "step": 23366 }, { "epoch": 0.7, "learning_rate": 1.0639450434708018e-06, "loss": 1.0981, "step": 23367 }, { "epoch": 0.7, "learning_rate": 1.0637453872737505e-06, "loss": 1.1781, "step": 23368 }, { "epoch": 0.7, "learning_rate": 1.0635457447491515e-06, "loss": 1.0623, "step": 23369 }, { "epoch": 0.7, "learning_rate": 1.0633461158989058e-06, "loss": 1.0364, "step": 23370 }, { "epoch": 0.7, "learning_rate": 1.0631465007249126e-06, "loss": 1.1947, "step": 23371 }, { "epoch": 0.7, "learning_rate": 1.0629468992290726e-06, "loss": 1.084, "step": 23372 }, { "epoch": 0.7, "learning_rate": 1.0627473114132858e-06, "loss": 1.2218, "step": 23373 }, { "epoch": 0.7, "learning_rate": 1.0625477372794536e-06, "loss": 1.1915, "step": 23374 }, { "epoch": 0.7, "learning_rate": 1.0623481768294734e-06, "loss": 1.1951, "step": 23375 }, { "epoch": 0.7, "learning_rate": 1.0621486300652465e-06, "loss": 1.1279, "step": 23376 }, { "epoch": 0.7, "learning_rate": 1.0619490969886716e-06, "loss": 1.0981, "step": 23377 }, { "epoch": 0.7, "learning_rate": 1.0617495776016493e-06, "loss": 1.0385, "step": 23378 }, { "epoch": 0.7, "learning_rate": 1.061550071906078e-06, "loss": 1.0572, "step": 23379 }, { "epoch": 0.7, "learning_rate": 1.0613505799038573e-06, "loss": 1.142, "step": 23380 }, { "epoch": 0.7, "learning_rate": 1.0611511015968864e-06, "loss": 1.1304, "step": 23381 }, { "epoch": 0.7, "learning_rate": 1.060951636987064e-06, "loss": 1.0731, "step": 23382 }, { "epoch": 0.7, "learning_rate": 1.0607521860762896e-06, "loss": 1.0798, "step": 23383 }, { "epoch": 0.7, "learning_rate": 1.0605527488664605e-06, "loss": 1.0499, "step": 23384 }, { "epoch": 0.7, "learning_rate": 1.0603533253594757e-06, "loss": 1.1272, "step": 23385 }, { "epoch": 0.7, "learning_rate": 1.0601539155572344e-06, "loss": 1.0792, "step": 23386 }, { "epoch": 0.7, "learning_rate": 1.0599545194616347e-06, "loss": 1.1152, "step": 23387 }, { "epoch": 0.7, "learning_rate": 1.059755137074574e-06, "loss": 1.2581, "step": 23388 }, { "epoch": 0.7, "learning_rate": 1.0595557683979505e-06, "loss": 1.1027, "step": 23389 }, { "epoch": 0.7, "learning_rate": 1.0593564134336626e-06, "loss": 0.9985, "step": 23390 }, { "epoch": 0.7, "learning_rate": 1.0591570721836076e-06, "loss": 1.0909, "step": 23391 }, { "epoch": 0.7, "learning_rate": 1.058957744649684e-06, "loss": 1.0554, "step": 23392 }, { "epoch": 0.7, "learning_rate": 1.058758430833788e-06, "loss": 1.2074, "step": 23393 }, { "epoch": 0.7, "learning_rate": 1.0585591307378177e-06, "loss": 1.0688, "step": 23394 }, { "epoch": 0.7, "learning_rate": 1.0583598443636703e-06, "loss": 1.1241, "step": 23395 }, { "epoch": 0.7, "learning_rate": 1.0581605717132434e-06, "loss": 1.1271, "step": 23396 }, { "epoch": 0.7, "learning_rate": 1.0579613127884328e-06, "loss": 1.09, "step": 23397 }, { "epoch": 0.7, "learning_rate": 1.057762067591136e-06, "loss": 1.0529, "step": 23398 }, { "epoch": 0.7, "learning_rate": 1.0575628361232496e-06, "loss": 1.2007, "step": 23399 }, { "epoch": 0.7, "learning_rate": 1.0573636183866714e-06, "loss": 1.0645, "step": 23400 }, { "epoch": 0.7, "learning_rate": 1.0571644143832956e-06, "loss": 1.1383, "step": 23401 }, { "epoch": 0.7, "learning_rate": 1.05696522411502e-06, "loss": 1.0056, "step": 23402 }, { "epoch": 0.71, "learning_rate": 1.0567660475837401e-06, "loss": 1.0992, "step": 23403 }, { "epoch": 0.71, "learning_rate": 1.0565668847913527e-06, "loss": 1.1415, "step": 23404 }, { "epoch": 0.71, "learning_rate": 1.0563677357397532e-06, "loss": 1.1946, "step": 23405 }, { "epoch": 0.71, "learning_rate": 1.0561686004308384e-06, "loss": 1.2043, "step": 23406 }, { "epoch": 0.71, "learning_rate": 1.0559694788665024e-06, "loss": 1.1409, "step": 23407 }, { "epoch": 0.71, "learning_rate": 1.0557703710486414e-06, "loss": 1.15, "step": 23408 }, { "epoch": 0.71, "learning_rate": 1.055571276979151e-06, "loss": 1.1855, "step": 23409 }, { "epoch": 0.71, "learning_rate": 1.0553721966599262e-06, "loss": 1.0435, "step": 23410 }, { "epoch": 0.71, "learning_rate": 1.0551731300928626e-06, "loss": 1.1065, "step": 23411 }, { "epoch": 0.71, "learning_rate": 1.0549740772798545e-06, "loss": 1.1057, "step": 23412 }, { "epoch": 0.71, "learning_rate": 1.0547750382227984e-06, "loss": 1.2678, "step": 23413 }, { "epoch": 0.71, "learning_rate": 1.0545760129235872e-06, "loss": 1.1301, "step": 23414 }, { "epoch": 0.71, "learning_rate": 1.054377001384116e-06, "loss": 1.1827, "step": 23415 }, { "epoch": 0.71, "learning_rate": 1.0541780036062792e-06, "loss": 1.1328, "step": 23416 }, { "epoch": 0.71, "learning_rate": 1.0539790195919723e-06, "loss": 1.0148, "step": 23417 }, { "epoch": 0.71, "learning_rate": 1.053780049343089e-06, "loss": 1.1999, "step": 23418 }, { "epoch": 0.71, "learning_rate": 1.0535810928615223e-06, "loss": 1.1912, "step": 23419 }, { "epoch": 0.71, "learning_rate": 1.053382150149167e-06, "loss": 1.1136, "step": 23420 }, { "epoch": 0.71, "learning_rate": 1.0531832212079169e-06, "loss": 1.0878, "step": 23421 }, { "epoch": 0.71, "learning_rate": 1.0529843060396667e-06, "loss": 1.1458, "step": 23422 }, { "epoch": 0.71, "learning_rate": 1.0527854046463078e-06, "loss": 1.0258, "step": 23423 }, { "epoch": 0.71, "learning_rate": 1.0525865170297353e-06, "loss": 1.0298, "step": 23424 }, { "epoch": 0.71, "learning_rate": 1.0523876431918418e-06, "loss": 1.1337, "step": 23425 }, { "epoch": 0.71, "learning_rate": 1.0521887831345217e-06, "loss": 1.239, "step": 23426 }, { "epoch": 0.71, "learning_rate": 1.0519899368596662e-06, "loss": 1.0947, "step": 23427 }, { "epoch": 0.71, "learning_rate": 1.0517911043691689e-06, "loss": 1.1742, "step": 23428 }, { "epoch": 0.71, "learning_rate": 1.051592285664923e-06, "loss": 1.1415, "step": 23429 }, { "epoch": 0.71, "learning_rate": 1.051393480748821e-06, "loss": 1.1246, "step": 23430 }, { "epoch": 0.71, "learning_rate": 1.0511946896227563e-06, "loss": 1.1547, "step": 23431 }, { "epoch": 0.71, "learning_rate": 1.0509959122886197e-06, "loss": 1.0674, "step": 23432 }, { "epoch": 0.71, "learning_rate": 1.0507971487483038e-06, "loss": 1.0419, "step": 23433 }, { "epoch": 0.71, "learning_rate": 1.050598399003701e-06, "loss": 1.0256, "step": 23434 }, { "epoch": 0.71, "learning_rate": 1.0503996630567036e-06, "loss": 1.1, "step": 23435 }, { "epoch": 0.71, "learning_rate": 1.0502009409092032e-06, "loss": 1.1637, "step": 23436 }, { "epoch": 0.71, "learning_rate": 1.0500022325630918e-06, "loss": 1.1584, "step": 23437 }, { "epoch": 0.71, "learning_rate": 1.0498035380202606e-06, "loss": 1.1539, "step": 23438 }, { "epoch": 0.71, "learning_rate": 1.049604857282602e-06, "loss": 1.0374, "step": 23439 }, { "epoch": 0.71, "learning_rate": 1.0494061903520062e-06, "loss": 1.0859, "step": 23440 }, { "epoch": 0.71, "learning_rate": 1.0492075372303646e-06, "loss": 1.052, "step": 23441 }, { "epoch": 0.71, "learning_rate": 1.0490088979195684e-06, "loss": 1.2067, "step": 23442 }, { "epoch": 0.71, "learning_rate": 1.0488102724215086e-06, "loss": 1.0821, "step": 23443 }, { "epoch": 0.71, "learning_rate": 1.0486116607380771e-06, "loss": 1.1718, "step": 23444 }, { "epoch": 0.71, "learning_rate": 1.0484130628711627e-06, "loss": 1.1365, "step": 23445 }, { "epoch": 0.71, "learning_rate": 1.048214478822657e-06, "loss": 1.1672, "step": 23446 }, { "epoch": 0.71, "learning_rate": 1.04801590859445e-06, "loss": 1.122, "step": 23447 }, { "epoch": 0.71, "learning_rate": 1.0478173521884333e-06, "loss": 1.09, "step": 23448 }, { "epoch": 0.71, "learning_rate": 1.0476188096064952e-06, "loss": 1.1216, "step": 23449 }, { "epoch": 0.71, "learning_rate": 1.0474202808505263e-06, "loss": 1.1671, "step": 23450 }, { "epoch": 0.71, "learning_rate": 1.0472217659224167e-06, "loss": 0.9888, "step": 23451 }, { "epoch": 0.71, "learning_rate": 1.0470232648240574e-06, "loss": 1.0866, "step": 23452 }, { "epoch": 0.71, "learning_rate": 1.0468247775573359e-06, "loss": 1.1267, "step": 23453 }, { "epoch": 0.71, "learning_rate": 1.0466263041241426e-06, "loss": 1.0219, "step": 23454 }, { "epoch": 0.71, "learning_rate": 1.0464278445263667e-06, "loss": 1.1815, "step": 23455 }, { "epoch": 0.71, "learning_rate": 1.0462293987658977e-06, "loss": 1.0685, "step": 23456 }, { "epoch": 0.71, "learning_rate": 1.0460309668446258e-06, "loss": 1.077, "step": 23457 }, { "epoch": 0.71, "learning_rate": 1.0458325487644378e-06, "loss": 1.0848, "step": 23458 }, { "epoch": 0.71, "learning_rate": 1.0456341445272236e-06, "loss": 1.0789, "step": 23459 }, { "epoch": 0.71, "learning_rate": 1.045435754134872e-06, "loss": 1.1421, "step": 23460 }, { "epoch": 0.71, "learning_rate": 1.0452373775892712e-06, "loss": 1.2532, "step": 23461 }, { "epoch": 0.71, "learning_rate": 1.0450390148923103e-06, "loss": 1.0635, "step": 23462 }, { "epoch": 0.71, "learning_rate": 1.044840666045877e-06, "loss": 1.0537, "step": 23463 }, { "epoch": 0.71, "learning_rate": 1.0446423310518596e-06, "loss": 1.1188, "step": 23464 }, { "epoch": 0.71, "learning_rate": 1.0444440099121475e-06, "loss": 1.1512, "step": 23465 }, { "epoch": 0.71, "learning_rate": 1.0442457026286264e-06, "loss": 1.1042, "step": 23466 }, { "epoch": 0.71, "learning_rate": 1.0440474092031852e-06, "loss": 1.1791, "step": 23467 }, { "epoch": 0.71, "learning_rate": 1.0438491296377113e-06, "loss": 1.0431, "step": 23468 }, { "epoch": 0.71, "learning_rate": 1.0436508639340923e-06, "loss": 1.1453, "step": 23469 }, { "epoch": 0.71, "learning_rate": 1.0434526120942168e-06, "loss": 1.1777, "step": 23470 }, { "epoch": 0.71, "learning_rate": 1.0432543741199698e-06, "loss": 1.0029, "step": 23471 }, { "epoch": 0.71, "learning_rate": 1.0430561500132397e-06, "loss": 1.1893, "step": 23472 }, { "epoch": 0.71, "learning_rate": 1.0428579397759133e-06, "loss": 1.0161, "step": 23473 }, { "epoch": 0.71, "learning_rate": 1.0426597434098784e-06, "loss": 1.1451, "step": 23474 }, { "epoch": 0.71, "learning_rate": 1.0424615609170202e-06, "loss": 1.0479, "step": 23475 }, { "epoch": 0.71, "learning_rate": 1.0422633922992255e-06, "loss": 1.1328, "step": 23476 }, { "epoch": 0.71, "learning_rate": 1.0420652375583816e-06, "loss": 1.0363, "step": 23477 }, { "epoch": 0.71, "learning_rate": 1.0418670966963756e-06, "loss": 1.0656, "step": 23478 }, { "epoch": 0.71, "learning_rate": 1.0416689697150914e-06, "loss": 1.0886, "step": 23479 }, { "epoch": 0.71, "learning_rate": 1.0414708566164162e-06, "loss": 1.0592, "step": 23480 }, { "epoch": 0.71, "learning_rate": 1.041272757402236e-06, "loss": 1.1847, "step": 23481 }, { "epoch": 0.71, "learning_rate": 1.0410746720744367e-06, "loss": 1.0926, "step": 23482 }, { "epoch": 0.71, "learning_rate": 1.0408766006349047e-06, "loss": 1.1165, "step": 23483 }, { "epoch": 0.71, "learning_rate": 1.0406785430855237e-06, "loss": 1.0848, "step": 23484 }, { "epoch": 0.71, "learning_rate": 1.0404804994281804e-06, "loss": 1.0798, "step": 23485 }, { "epoch": 0.71, "learning_rate": 1.0402824696647596e-06, "loss": 1.1263, "step": 23486 }, { "epoch": 0.71, "learning_rate": 1.040084453797147e-06, "loss": 0.9749, "step": 23487 }, { "epoch": 0.71, "learning_rate": 1.0398864518272266e-06, "loss": 1.0593, "step": 23488 }, { "epoch": 0.71, "learning_rate": 1.0396884637568855e-06, "loss": 1.2388, "step": 23489 }, { "epoch": 0.71, "learning_rate": 1.039490489588006e-06, "loss": 1.0173, "step": 23490 }, { "epoch": 0.71, "learning_rate": 1.0392925293224731e-06, "loss": 1.0393, "step": 23491 }, { "epoch": 0.71, "learning_rate": 1.0390945829621724e-06, "loss": 1.1631, "step": 23492 }, { "epoch": 0.71, "learning_rate": 1.0388966505089872e-06, "loss": 1.1199, "step": 23493 }, { "epoch": 0.71, "learning_rate": 1.0386987319648026e-06, "loss": 0.9772, "step": 23494 }, { "epoch": 0.71, "learning_rate": 1.0385008273315022e-06, "loss": 1.059, "step": 23495 }, { "epoch": 0.71, "learning_rate": 1.038302936610971e-06, "loss": 1.0353, "step": 23496 }, { "epoch": 0.71, "learning_rate": 1.0381050598050907e-06, "loss": 1.1812, "step": 23497 }, { "epoch": 0.71, "learning_rate": 1.037907196915746e-06, "loss": 1.1795, "step": 23498 }, { "epoch": 0.71, "learning_rate": 1.0377093479448212e-06, "loss": 1.095, "step": 23499 }, { "epoch": 0.71, "learning_rate": 1.0375115128941998e-06, "loss": 1.1221, "step": 23500 }, { "epoch": 0.71, "learning_rate": 1.0373136917657633e-06, "loss": 0.9778, "step": 23501 }, { "epoch": 0.71, "learning_rate": 1.0371158845613963e-06, "loss": 1.0742, "step": 23502 }, { "epoch": 0.71, "learning_rate": 1.0369180912829815e-06, "loss": 1.0689, "step": 23503 }, { "epoch": 0.71, "learning_rate": 1.0367203119324027e-06, "loss": 1.0995, "step": 23504 }, { "epoch": 0.71, "learning_rate": 1.0365225465115408e-06, "loss": 1.0917, "step": 23505 }, { "epoch": 0.71, "learning_rate": 1.0363247950222793e-06, "loss": 1.1385, "step": 23506 }, { "epoch": 0.71, "learning_rate": 1.0361270574665012e-06, "loss": 0.9894, "step": 23507 }, { "epoch": 0.71, "learning_rate": 1.0359293338460882e-06, "loss": 1.0681, "step": 23508 }, { "epoch": 0.71, "learning_rate": 1.0357316241629236e-06, "loss": 1.0623, "step": 23509 }, { "epoch": 0.71, "learning_rate": 1.0355339284188882e-06, "loss": 1.1713, "step": 23510 }, { "epoch": 0.71, "learning_rate": 1.0353362466158641e-06, "loss": 1.0629, "step": 23511 }, { "epoch": 0.71, "learning_rate": 1.0351385787557338e-06, "loss": 1.1627, "step": 23512 }, { "epoch": 0.71, "learning_rate": 1.0349409248403798e-06, "loss": 1.1127, "step": 23513 }, { "epoch": 0.71, "learning_rate": 1.0347432848716813e-06, "loss": 1.2274, "step": 23514 }, { "epoch": 0.71, "learning_rate": 1.0345456588515212e-06, "loss": 0.9919, "step": 23515 }, { "epoch": 0.71, "learning_rate": 1.0343480467817807e-06, "loss": 1.1545, "step": 23516 }, { "epoch": 0.71, "learning_rate": 1.0341504486643409e-06, "loss": 1.0677, "step": 23517 }, { "epoch": 0.71, "learning_rate": 1.0339528645010828e-06, "loss": 1.0381, "step": 23518 }, { "epoch": 0.71, "learning_rate": 1.0337552942938872e-06, "loss": 1.1685, "step": 23519 }, { "epoch": 0.71, "learning_rate": 1.0335577380446352e-06, "loss": 1.0829, "step": 23520 }, { "epoch": 0.71, "learning_rate": 1.0333601957552072e-06, "loss": 1.03, "step": 23521 }, { "epoch": 0.71, "learning_rate": 1.0331626674274847e-06, "loss": 1.0574, "step": 23522 }, { "epoch": 0.71, "learning_rate": 1.0329651530633464e-06, "loss": 1.1439, "step": 23523 }, { "epoch": 0.71, "learning_rate": 1.0327676526646732e-06, "loss": 0.999, "step": 23524 }, { "epoch": 0.71, "learning_rate": 1.0325701662333451e-06, "loss": 1.0104, "step": 23525 }, { "epoch": 0.71, "learning_rate": 1.0323726937712436e-06, "loss": 1.0654, "step": 23526 }, { "epoch": 0.71, "learning_rate": 1.032175235280246e-06, "loss": 1.0747, "step": 23527 }, { "epoch": 0.71, "learning_rate": 1.0319777907622332e-06, "loss": 1.1288, "step": 23528 }, { "epoch": 0.71, "learning_rate": 1.0317803602190852e-06, "loss": 1.0201, "step": 23529 }, { "epoch": 0.71, "learning_rate": 1.0315829436526815e-06, "loss": 1.1627, "step": 23530 }, { "epoch": 0.71, "learning_rate": 1.0313855410649e-06, "loss": 1.0585, "step": 23531 }, { "epoch": 0.71, "learning_rate": 1.0311881524576214e-06, "loss": 1.1069, "step": 23532 }, { "epoch": 0.71, "learning_rate": 1.0309907778327239e-06, "loss": 1.1361, "step": 23533 }, { "epoch": 0.71, "learning_rate": 1.0307934171920866e-06, "loss": 1.0051, "step": 23534 }, { "epoch": 0.71, "learning_rate": 1.0305960705375892e-06, "loss": 1.107, "step": 23535 }, { "epoch": 0.71, "learning_rate": 1.0303987378711089e-06, "loss": 1.1726, "step": 23536 }, { "epoch": 0.71, "learning_rate": 1.0302014191945246e-06, "loss": 1.1594, "step": 23537 }, { "epoch": 0.71, "learning_rate": 1.030004114509715e-06, "loss": 1.069, "step": 23538 }, { "epoch": 0.71, "learning_rate": 1.029806823818559e-06, "loss": 1.1646, "step": 23539 }, { "epoch": 0.71, "learning_rate": 1.0296095471229333e-06, "loss": 1.1015, "step": 23540 }, { "epoch": 0.71, "learning_rate": 1.0294122844247164e-06, "loss": 1.0965, "step": 23541 }, { "epoch": 0.71, "learning_rate": 1.0292150357257866e-06, "loss": 1.1506, "step": 23542 }, { "epoch": 0.71, "learning_rate": 1.029017801028021e-06, "loss": 1.2209, "step": 23543 }, { "epoch": 0.71, "learning_rate": 1.0288205803332976e-06, "loss": 1.1109, "step": 23544 }, { "epoch": 0.71, "learning_rate": 1.0286233736434936e-06, "loss": 1.1701, "step": 23545 }, { "epoch": 0.71, "learning_rate": 1.0284261809604865e-06, "loss": 1.0919, "step": 23546 }, { "epoch": 0.71, "learning_rate": 1.0282290022861543e-06, "loss": 1.082, "step": 23547 }, { "epoch": 0.71, "learning_rate": 1.0280318376223724e-06, "loss": 1.2153, "step": 23548 }, { "epoch": 0.71, "learning_rate": 1.0278346869710184e-06, "loss": 1.1623, "step": 23549 }, { "epoch": 0.71, "learning_rate": 1.0276375503339692e-06, "loss": 1.0772, "step": 23550 }, { "epoch": 0.71, "learning_rate": 1.0274404277131015e-06, "loss": 1.1295, "step": 23551 }, { "epoch": 0.71, "learning_rate": 1.0272433191102924e-06, "loss": 1.152, "step": 23552 }, { "epoch": 0.71, "learning_rate": 1.0270462245274165e-06, "loss": 0.974, "step": 23553 }, { "epoch": 0.71, "learning_rate": 1.0268491439663516e-06, "loss": 0.975, "step": 23554 }, { "epoch": 0.71, "learning_rate": 1.0266520774289732e-06, "loss": 1.0199, "step": 23555 }, { "epoch": 0.71, "learning_rate": 1.0264550249171581e-06, "loss": 1.2222, "step": 23556 }, { "epoch": 0.71, "learning_rate": 1.026257986432781e-06, "loss": 1.1206, "step": 23557 }, { "epoch": 0.71, "learning_rate": 1.0260609619777178e-06, "loss": 1.0941, "step": 23558 }, { "epoch": 0.71, "learning_rate": 1.0258639515538446e-06, "loss": 1.0639, "step": 23559 }, { "epoch": 0.71, "learning_rate": 1.0256669551630372e-06, "loss": 1.1079, "step": 23560 }, { "epoch": 0.71, "learning_rate": 1.0254699728071696e-06, "loss": 1.1489, "step": 23561 }, { "epoch": 0.71, "learning_rate": 1.0252730044881178e-06, "loss": 1.1057, "step": 23562 }, { "epoch": 0.71, "learning_rate": 1.0250760502077567e-06, "loss": 0.9813, "step": 23563 }, { "epoch": 0.71, "learning_rate": 1.0248791099679611e-06, "loss": 1.1553, "step": 23564 }, { "epoch": 0.71, "learning_rate": 1.024682183770607e-06, "loss": 1.0409, "step": 23565 }, { "epoch": 0.71, "learning_rate": 1.0244852716175668e-06, "loss": 1.0739, "step": 23566 }, { "epoch": 0.71, "learning_rate": 1.0242883735107166e-06, "loss": 1.2073, "step": 23567 }, { "epoch": 0.71, "learning_rate": 1.02409148945193e-06, "loss": 1.1441, "step": 23568 }, { "epoch": 0.71, "learning_rate": 1.0238946194430818e-06, "loss": 1.106, "step": 23569 }, { "epoch": 0.71, "learning_rate": 1.0236977634860456e-06, "loss": 1.1781, "step": 23570 }, { "epoch": 0.71, "learning_rate": 1.023500921582697e-06, "loss": 1.2273, "step": 23571 }, { "epoch": 0.71, "learning_rate": 1.0233040937349073e-06, "loss": 1.0632, "step": 23572 }, { "epoch": 0.71, "learning_rate": 1.0231072799445519e-06, "loss": 1.1107, "step": 23573 }, { "epoch": 0.71, "learning_rate": 1.0229104802135034e-06, "loss": 1.1623, "step": 23574 }, { "epoch": 0.71, "learning_rate": 1.0227136945436358e-06, "loss": 1.0522, "step": 23575 }, { "epoch": 0.71, "learning_rate": 1.0225169229368226e-06, "loss": 1.1224, "step": 23576 }, { "epoch": 0.71, "learning_rate": 1.0223201653949362e-06, "loss": 1.0068, "step": 23577 }, { "epoch": 0.71, "learning_rate": 1.0221234219198516e-06, "loss": 1.0579, "step": 23578 }, { "epoch": 0.71, "learning_rate": 1.0219266925134391e-06, "loss": 1.2471, "step": 23579 }, { "epoch": 0.71, "learning_rate": 1.021729977177573e-06, "loss": 1.134, "step": 23580 }, { "epoch": 0.71, "learning_rate": 1.021533275914125e-06, "loss": 1.0911, "step": 23581 }, { "epoch": 0.71, "learning_rate": 1.0213365887249694e-06, "loss": 1.1682, "step": 23582 }, { "epoch": 0.71, "learning_rate": 1.0211399156119763e-06, "loss": 1.0493, "step": 23583 }, { "epoch": 0.71, "learning_rate": 1.0209432565770188e-06, "loss": 1.0312, "step": 23584 }, { "epoch": 0.71, "learning_rate": 1.0207466116219693e-06, "loss": 1.1511, "step": 23585 }, { "epoch": 0.71, "learning_rate": 1.0205499807487007e-06, "loss": 1.1259, "step": 23586 }, { "epoch": 0.71, "learning_rate": 1.0203533639590828e-06, "loss": 1.1055, "step": 23587 }, { "epoch": 0.71, "learning_rate": 1.0201567612549882e-06, "loss": 1.0787, "step": 23588 }, { "epoch": 0.71, "learning_rate": 1.0199601726382886e-06, "loss": 1.1356, "step": 23589 }, { "epoch": 0.71, "learning_rate": 1.019763598110855e-06, "loss": 1.0585, "step": 23590 }, { "epoch": 0.71, "learning_rate": 1.0195670376745604e-06, "loss": 1.1307, "step": 23591 }, { "epoch": 0.71, "learning_rate": 1.0193704913312735e-06, "loss": 1.1716, "step": 23592 }, { "epoch": 0.71, "learning_rate": 1.0191739590828665e-06, "loss": 1.1762, "step": 23593 }, { "epoch": 0.71, "learning_rate": 1.01897744093121e-06, "loss": 1.1147, "step": 23594 }, { "epoch": 0.71, "learning_rate": 1.018780936878176e-06, "loss": 1.0769, "step": 23595 }, { "epoch": 0.71, "learning_rate": 1.0185844469256331e-06, "loss": 1.1097, "step": 23596 }, { "epoch": 0.71, "learning_rate": 1.018387971075453e-06, "loss": 0.9634, "step": 23597 }, { "epoch": 0.71, "learning_rate": 1.0181915093295056e-06, "loss": 1.1552, "step": 23598 }, { "epoch": 0.71, "learning_rate": 1.0179950616896617e-06, "loss": 1.0605, "step": 23599 }, { "epoch": 0.71, "learning_rate": 1.0177986281577907e-06, "loss": 1.0333, "step": 23600 }, { "epoch": 0.71, "learning_rate": 1.017602208735763e-06, "loss": 1.0353, "step": 23601 }, { "epoch": 0.71, "learning_rate": 1.0174058034254485e-06, "loss": 1.1469, "step": 23602 }, { "epoch": 0.71, "learning_rate": 1.0172094122287165e-06, "loss": 1.1588, "step": 23603 }, { "epoch": 0.71, "learning_rate": 1.0170130351474379e-06, "loss": 1.1187, "step": 23604 }, { "epoch": 0.71, "learning_rate": 1.01681667218348e-06, "loss": 1.1302, "step": 23605 }, { "epoch": 0.71, "learning_rate": 1.0166203233387129e-06, "loss": 1.1318, "step": 23606 }, { "epoch": 0.71, "learning_rate": 1.016423988615006e-06, "loss": 1.1232, "step": 23607 }, { "epoch": 0.71, "learning_rate": 1.0162276680142292e-06, "loss": 1.0939, "step": 23608 }, { "epoch": 0.71, "learning_rate": 1.0160313615382495e-06, "loss": 1.0452, "step": 23609 }, { "epoch": 0.71, "learning_rate": 1.0158350691889363e-06, "loss": 1.0868, "step": 23610 }, { "epoch": 0.71, "learning_rate": 1.0156387909681586e-06, "loss": 1.1671, "step": 23611 }, { "epoch": 0.71, "learning_rate": 1.0154425268777857e-06, "loss": 1.1816, "step": 23612 }, { "epoch": 0.71, "learning_rate": 1.0152462769196838e-06, "loss": 1.0854, "step": 23613 }, { "epoch": 0.71, "learning_rate": 1.0150500410957223e-06, "loss": 1.1558, "step": 23614 }, { "epoch": 0.71, "learning_rate": 1.0148538194077696e-06, "loss": 1.1177, "step": 23615 }, { "epoch": 0.71, "learning_rate": 1.014657611857693e-06, "loss": 1.175, "step": 23616 }, { "epoch": 0.71, "learning_rate": 1.0144614184473613e-06, "loss": 1.0275, "step": 23617 }, { "epoch": 0.71, "learning_rate": 1.014265239178641e-06, "loss": 1.2281, "step": 23618 }, { "epoch": 0.71, "learning_rate": 1.0140690740533995e-06, "loss": 1.2523, "step": 23619 }, { "epoch": 0.71, "learning_rate": 1.013872923073505e-06, "loss": 1.1443, "step": 23620 }, { "epoch": 0.71, "learning_rate": 1.0136767862408257e-06, "loss": 1.1525, "step": 23621 }, { "epoch": 0.71, "learning_rate": 1.0134806635572263e-06, "loss": 1.0048, "step": 23622 }, { "epoch": 0.71, "learning_rate": 1.0132845550245755e-06, "loss": 1.0773, "step": 23623 }, { "epoch": 0.71, "learning_rate": 1.0130884606447392e-06, "loss": 1.3239, "step": 23624 }, { "epoch": 0.71, "learning_rate": 1.0128923804195847e-06, "loss": 1.1398, "step": 23625 }, { "epoch": 0.71, "learning_rate": 1.0126963143509787e-06, "loss": 1.0593, "step": 23626 }, { "epoch": 0.71, "learning_rate": 1.0125002624407876e-06, "loss": 1.155, "step": 23627 }, { "epoch": 0.71, "learning_rate": 1.0123042246908774e-06, "loss": 1.1263, "step": 23628 }, { "epoch": 0.71, "learning_rate": 1.0121082011031144e-06, "loss": 1.0592, "step": 23629 }, { "epoch": 0.71, "learning_rate": 1.0119121916793658e-06, "loss": 1.4125, "step": 23630 }, { "epoch": 0.71, "learning_rate": 1.0117161964214955e-06, "loss": 1.2554, "step": 23631 }, { "epoch": 0.71, "learning_rate": 1.0115202153313702e-06, "loss": 1.0433, "step": 23632 }, { "epoch": 0.71, "learning_rate": 1.0113242484108557e-06, "loss": 1.1638, "step": 23633 }, { "epoch": 0.71, "learning_rate": 1.0111282956618182e-06, "loss": 1.1559, "step": 23634 }, { "epoch": 0.71, "learning_rate": 1.0109323570861213e-06, "loss": 1.1687, "step": 23635 }, { "epoch": 0.71, "learning_rate": 1.0107364326856312e-06, "loss": 1.1348, "step": 23636 }, { "epoch": 0.71, "learning_rate": 1.010540522462213e-06, "loss": 0.9702, "step": 23637 }, { "epoch": 0.71, "learning_rate": 1.0103446264177327e-06, "loss": 1.0425, "step": 23638 }, { "epoch": 0.71, "learning_rate": 1.010148744554053e-06, "loss": 1.1664, "step": 23639 }, { "epoch": 0.71, "learning_rate": 1.0099528768730398e-06, "loss": 1.0812, "step": 23640 }, { "epoch": 0.71, "learning_rate": 1.0097570233765577e-06, "loss": 1.0308, "step": 23641 }, { "epoch": 0.71, "learning_rate": 1.009561184066471e-06, "loss": 0.9604, "step": 23642 }, { "epoch": 0.71, "learning_rate": 1.0093653589446447e-06, "loss": 1.1519, "step": 23643 }, { "epoch": 0.71, "learning_rate": 1.009169548012942e-06, "loss": 1.1882, "step": 23644 }, { "epoch": 0.71, "learning_rate": 1.0089737512732265e-06, "loss": 1.0898, "step": 23645 }, { "epoch": 0.71, "learning_rate": 1.008777968727363e-06, "loss": 1.0419, "step": 23646 }, { "epoch": 0.71, "learning_rate": 1.0085822003772157e-06, "loss": 1.106, "step": 23647 }, { "epoch": 0.71, "learning_rate": 1.008386446224647e-06, "loss": 1.0358, "step": 23648 }, { "epoch": 0.71, "learning_rate": 1.008190706271521e-06, "loss": 1.0561, "step": 23649 }, { "epoch": 0.71, "learning_rate": 1.007994980519701e-06, "loss": 1.0525, "step": 23650 }, { "epoch": 0.71, "learning_rate": 1.0077992689710498e-06, "loss": 1.167, "step": 23651 }, { "epoch": 0.71, "learning_rate": 1.0076035716274312e-06, "loss": 1.0029, "step": 23652 }, { "epoch": 0.71, "learning_rate": 1.0074078884907087e-06, "loss": 1.0712, "step": 23653 }, { "epoch": 0.71, "learning_rate": 1.0072122195627435e-06, "loss": 1.1158, "step": 23654 }, { "epoch": 0.71, "learning_rate": 1.0070165648453986e-06, "loss": 1.1033, "step": 23655 }, { "epoch": 0.71, "learning_rate": 1.0068209243405372e-06, "loss": 1.1296, "step": 23656 }, { "epoch": 0.71, "learning_rate": 1.0066252980500216e-06, "loss": 0.9584, "step": 23657 }, { "epoch": 0.71, "learning_rate": 1.0064296859757138e-06, "loss": 1.1628, "step": 23658 }, { "epoch": 0.71, "learning_rate": 1.0062340881194759e-06, "loss": 1.152, "step": 23659 }, { "epoch": 0.71, "learning_rate": 1.006038504483171e-06, "loss": 1.15, "step": 23660 }, { "epoch": 0.71, "learning_rate": 1.0058429350686594e-06, "loss": 1.1748, "step": 23661 }, { "epoch": 0.71, "learning_rate": 1.0056473798778033e-06, "loss": 1.1317, "step": 23662 }, { "epoch": 0.71, "learning_rate": 1.0054518389124645e-06, "loss": 1.1209, "step": 23663 }, { "epoch": 0.71, "learning_rate": 1.0052563121745052e-06, "loss": 1.062, "step": 23664 }, { "epoch": 0.71, "learning_rate": 1.005060799665785e-06, "loss": 1.1199, "step": 23665 }, { "epoch": 0.71, "learning_rate": 1.004865301388166e-06, "loss": 1.1119, "step": 23666 }, { "epoch": 0.71, "learning_rate": 1.0046698173435093e-06, "loss": 1.114, "step": 23667 }, { "epoch": 0.71, "learning_rate": 1.0044743475336757e-06, "loss": 1.119, "step": 23668 }, { "epoch": 0.71, "learning_rate": 1.004278891960527e-06, "loss": 1.1812, "step": 23669 }, { "epoch": 0.71, "learning_rate": 1.004083450625922e-06, "loss": 1.1054, "step": 23670 }, { "epoch": 0.71, "learning_rate": 1.0038880235317223e-06, "loss": 1.0406, "step": 23671 }, { "epoch": 0.71, "learning_rate": 1.0036926106797877e-06, "loss": 1.0864, "step": 23672 }, { "epoch": 0.71, "learning_rate": 1.0034972120719796e-06, "loss": 1.1399, "step": 23673 }, { "epoch": 0.71, "learning_rate": 1.0033018277101566e-06, "loss": 1.103, "step": 23674 }, { "epoch": 0.71, "learning_rate": 1.0031064575961797e-06, "loss": 1.1234, "step": 23675 }, { "epoch": 0.71, "learning_rate": 1.002911101731908e-06, "loss": 1.0983, "step": 23676 }, { "epoch": 0.71, "learning_rate": 1.0027157601192025e-06, "loss": 1.1908, "step": 23677 }, { "epoch": 0.71, "learning_rate": 1.002520432759921e-06, "loss": 1.012, "step": 23678 }, { "epoch": 0.71, "learning_rate": 1.002325119655924e-06, "loss": 1.1711, "step": 23679 }, { "epoch": 0.71, "learning_rate": 1.0021298208090703e-06, "loss": 0.9832, "step": 23680 }, { "epoch": 0.71, "learning_rate": 1.0019345362212194e-06, "loss": 1.1702, "step": 23681 }, { "epoch": 0.71, "learning_rate": 1.0017392658942302e-06, "loss": 1.0213, "step": 23682 }, { "epoch": 0.71, "learning_rate": 1.0015440098299614e-06, "loss": 1.1469, "step": 23683 }, { "epoch": 0.71, "learning_rate": 1.0013487680302723e-06, "loss": 1.1097, "step": 23684 }, { "epoch": 0.71, "learning_rate": 1.0011535404970208e-06, "loss": 1.1985, "step": 23685 }, { "epoch": 0.71, "learning_rate": 1.0009583272320669e-06, "loss": 1.0478, "step": 23686 }, { "epoch": 0.71, "learning_rate": 1.0007631282372667e-06, "loss": 1.0923, "step": 23687 }, { "epoch": 0.71, "learning_rate": 1.0005679435144794e-06, "loss": 1.2186, "step": 23688 }, { "epoch": 0.71, "learning_rate": 1.0003727730655633e-06, "loss": 1.1172, "step": 23689 }, { "epoch": 0.71, "learning_rate": 1.000177616892377e-06, "loss": 1.0956, "step": 23690 }, { "epoch": 0.71, "learning_rate": 9.999824749967766e-07, "loss": 1.1519, "step": 23691 }, { "epoch": 0.71, "learning_rate": 9.997873473806205e-07, "loss": 1.1171, "step": 23692 }, { "epoch": 0.71, "learning_rate": 9.995922340457664e-07, "loss": 1.1385, "step": 23693 }, { "epoch": 0.71, "learning_rate": 9.993971349940718e-07, "loss": 0.9581, "step": 23694 }, { "epoch": 0.71, "learning_rate": 9.992020502273944e-07, "loss": 1.013, "step": 23695 }, { "epoch": 0.71, "learning_rate": 9.990069797475897e-07, "loss": 1.0994, "step": 23696 }, { "epoch": 0.71, "learning_rate": 9.988119235565157e-07, "loss": 1.1201, "step": 23697 }, { "epoch": 0.71, "learning_rate": 9.986168816560293e-07, "loss": 1.2239, "step": 23698 }, { "epoch": 0.71, "learning_rate": 9.984218540479881e-07, "loss": 1.2667, "step": 23699 }, { "epoch": 0.71, "learning_rate": 9.982268407342467e-07, "loss": 1.1249, "step": 23700 }, { "epoch": 0.71, "learning_rate": 9.980318417166623e-07, "loss": 1.1387, "step": 23701 }, { "epoch": 0.71, "learning_rate": 9.978368569970915e-07, "loss": 1.0662, "step": 23702 }, { "epoch": 0.71, "learning_rate": 9.976418865773913e-07, "loss": 1.074, "step": 23703 }, { "epoch": 0.71, "learning_rate": 9.974469304594158e-07, "loss": 1.1099, "step": 23704 }, { "epoch": 0.71, "learning_rate": 9.972519886450218e-07, "loss": 1.0884, "step": 23705 }, { "epoch": 0.71, "learning_rate": 9.970570611360656e-07, "loss": 0.9838, "step": 23706 }, { "epoch": 0.71, "learning_rate": 9.968621479344018e-07, "loss": 0.9453, "step": 23707 }, { "epoch": 0.71, "learning_rate": 9.966672490418866e-07, "loss": 1.038, "step": 23708 }, { "epoch": 0.71, "learning_rate": 9.964723644603751e-07, "loss": 0.9315, "step": 23709 }, { "epoch": 0.71, "learning_rate": 9.962774941917227e-07, "loss": 1.0395, "step": 23710 }, { "epoch": 0.71, "learning_rate": 9.960826382377842e-07, "loss": 1.1429, "step": 23711 }, { "epoch": 0.71, "learning_rate": 9.958877966004158e-07, "loss": 1.2808, "step": 23712 }, { "epoch": 0.71, "learning_rate": 9.956929692814698e-07, "loss": 1.1006, "step": 23713 }, { "epoch": 0.71, "learning_rate": 9.954981562828026e-07, "loss": 1.0888, "step": 23714 }, { "epoch": 0.71, "learning_rate": 9.953033576062685e-07, "loss": 1.0793, "step": 23715 }, { "epoch": 0.71, "learning_rate": 9.951085732537222e-07, "loss": 1.1275, "step": 23716 }, { "epoch": 0.71, "learning_rate": 9.949138032270169e-07, "loss": 1.0974, "step": 23717 }, { "epoch": 0.71, "learning_rate": 9.947190475280072e-07, "loss": 1.1371, "step": 23718 }, { "epoch": 0.71, "learning_rate": 9.945243061585475e-07, "loss": 1.1113, "step": 23719 }, { "epoch": 0.71, "learning_rate": 9.94329579120492e-07, "loss": 1.1683, "step": 23720 }, { "epoch": 0.71, "learning_rate": 9.941348664156926e-07, "loss": 1.173, "step": 23721 }, { "epoch": 0.71, "learning_rate": 9.939401680460044e-07, "loss": 1.1129, "step": 23722 }, { "epoch": 0.71, "learning_rate": 9.937454840132804e-07, "loss": 1.1395, "step": 23723 }, { "epoch": 0.71, "learning_rate": 9.93550814319374e-07, "loss": 1.1565, "step": 23724 }, { "epoch": 0.71, "learning_rate": 9.93356158966139e-07, "loss": 1.0679, "step": 23725 }, { "epoch": 0.71, "learning_rate": 9.931615179554268e-07, "loss": 1.1533, "step": 23726 }, { "epoch": 0.71, "learning_rate": 9.929668912890916e-07, "loss": 0.952, "step": 23727 }, { "epoch": 0.71, "learning_rate": 9.927722789689856e-07, "loss": 1.0813, "step": 23728 }, { "epoch": 0.71, "learning_rate": 9.925776809969622e-07, "loss": 1.0745, "step": 23729 }, { "epoch": 0.71, "learning_rate": 9.923830973748726e-07, "loss": 1.0531, "step": 23730 }, { "epoch": 0.71, "learning_rate": 9.921885281045701e-07, "loss": 1.1324, "step": 23731 }, { "epoch": 0.71, "learning_rate": 9.919939731879063e-07, "loss": 0.9481, "step": 23732 }, { "epoch": 0.71, "learning_rate": 9.917994326267335e-07, "loss": 1.0092, "step": 23733 }, { "epoch": 0.71, "learning_rate": 9.91604906422904e-07, "loss": 1.1572, "step": 23734 }, { "epoch": 0.72, "learning_rate": 9.914103945782693e-07, "loss": 0.9927, "step": 23735 }, { "epoch": 0.72, "learning_rate": 9.912158970946819e-07, "loss": 1.0968, "step": 23736 }, { "epoch": 0.72, "learning_rate": 9.910214139739915e-07, "loss": 1.1196, "step": 23737 }, { "epoch": 0.72, "learning_rate": 9.908269452180508e-07, "loss": 1.0112, "step": 23738 }, { "epoch": 0.72, "learning_rate": 9.906324908287104e-07, "loss": 1.1281, "step": 23739 }, { "epoch": 0.72, "learning_rate": 9.904380508078221e-07, "loss": 1.1495, "step": 23740 }, { "epoch": 0.72, "learning_rate": 9.902436251572362e-07, "loss": 1.1946, "step": 23741 }, { "epoch": 0.72, "learning_rate": 9.900492138788049e-07, "loss": 1.1575, "step": 23742 }, { "epoch": 0.72, "learning_rate": 9.898548169743768e-07, "loss": 1.1998, "step": 23743 }, { "epoch": 0.72, "learning_rate": 9.896604344458039e-07, "loss": 1.1612, "step": 23744 }, { "epoch": 0.72, "learning_rate": 9.89466066294936e-07, "loss": 1.0616, "step": 23745 }, { "epoch": 0.72, "learning_rate": 9.892717125236246e-07, "loss": 1.0905, "step": 23746 }, { "epoch": 0.72, "learning_rate": 9.89077373133718e-07, "loss": 1.069, "step": 23747 }, { "epoch": 0.72, "learning_rate": 9.88883048127067e-07, "loss": 1.2089, "step": 23748 }, { "epoch": 0.72, "learning_rate": 9.886887375055218e-07, "loss": 1.1626, "step": 23749 }, { "epoch": 0.72, "learning_rate": 9.88494441270932e-07, "loss": 1.0533, "step": 23750 }, { "epoch": 0.72, "learning_rate": 9.883001594251478e-07, "loss": 1.0909, "step": 23751 }, { "epoch": 0.72, "learning_rate": 9.881058919700173e-07, "loss": 1.048, "step": 23752 }, { "epoch": 0.72, "learning_rate": 9.879116389073906e-07, "loss": 0.9765, "step": 23753 }, { "epoch": 0.72, "learning_rate": 9.877174002391167e-07, "loss": 1.0945, "step": 23754 }, { "epoch": 0.72, "learning_rate": 9.875231759670456e-07, "loss": 1.1637, "step": 23755 }, { "epoch": 0.72, "learning_rate": 9.873289660930249e-07, "loss": 1.2693, "step": 23756 }, { "epoch": 0.72, "learning_rate": 9.871347706189036e-07, "loss": 1.0656, "step": 23757 }, { "epoch": 0.72, "learning_rate": 9.869405895465308e-07, "loss": 1.0799, "step": 23758 }, { "epoch": 0.72, "learning_rate": 9.867464228777557e-07, "loss": 0.9847, "step": 23759 }, { "epoch": 0.72, "learning_rate": 9.86552270614425e-07, "loss": 1.1434, "step": 23760 }, { "epoch": 0.72, "learning_rate": 9.863581327583877e-07, "loss": 1.1978, "step": 23761 }, { "epoch": 0.72, "learning_rate": 9.86164009311492e-07, "loss": 1.1388, "step": 23762 }, { "epoch": 0.72, "learning_rate": 9.85969900275586e-07, "loss": 1.1425, "step": 23763 }, { "epoch": 0.72, "learning_rate": 9.857758056525175e-07, "loss": 1.0347, "step": 23764 }, { "epoch": 0.72, "learning_rate": 9.855817254441335e-07, "loss": 1.0932, "step": 23765 }, { "epoch": 0.72, "learning_rate": 9.853876596522826e-07, "loss": 1.2066, "step": 23766 }, { "epoch": 0.72, "learning_rate": 9.851936082788117e-07, "loss": 1.1162, "step": 23767 }, { "epoch": 0.72, "learning_rate": 9.849995713255687e-07, "loss": 1.1041, "step": 23768 }, { "epoch": 0.72, "learning_rate": 9.848055487943995e-07, "loss": 1.1454, "step": 23769 }, { "epoch": 0.72, "learning_rate": 9.846115406871515e-07, "loss": 1.0428, "step": 23770 }, { "epoch": 0.72, "learning_rate": 9.844175470056718e-07, "loss": 1.1536, "step": 23771 }, { "epoch": 0.72, "learning_rate": 9.84223567751808e-07, "loss": 1.0558, "step": 23772 }, { "epoch": 0.72, "learning_rate": 9.840296029274052e-07, "loss": 1.0891, "step": 23773 }, { "epoch": 0.72, "learning_rate": 9.8383565253431e-07, "loss": 1.0204, "step": 23774 }, { "epoch": 0.72, "learning_rate": 9.836417165743698e-07, "loss": 1.0525, "step": 23775 }, { "epoch": 0.72, "learning_rate": 9.834477950494297e-07, "loss": 1.11, "step": 23776 }, { "epoch": 0.72, "learning_rate": 9.832538879613374e-07, "loss": 1.1151, "step": 23777 }, { "epoch": 0.72, "learning_rate": 9.830599953119364e-07, "loss": 1.1135, "step": 23778 }, { "epoch": 0.72, "learning_rate": 9.828661171030737e-07, "loss": 1.0287, "step": 23779 }, { "epoch": 0.72, "learning_rate": 9.826722533365952e-07, "loss": 1.1299, "step": 23780 }, { "epoch": 0.72, "learning_rate": 9.824784040143468e-07, "loss": 1.2086, "step": 23781 }, { "epoch": 0.72, "learning_rate": 9.82284569138172e-07, "loss": 1.0612, "step": 23782 }, { "epoch": 0.72, "learning_rate": 9.820907487099174e-07, "loss": 1.0988, "step": 23783 }, { "epoch": 0.72, "learning_rate": 9.818969427314276e-07, "loss": 1.0797, "step": 23784 }, { "epoch": 0.72, "learning_rate": 9.817031512045489e-07, "loss": 1.0542, "step": 23785 }, { "epoch": 0.72, "learning_rate": 9.81509374131124e-07, "loss": 1.0469, "step": 23786 }, { "epoch": 0.72, "learning_rate": 9.813156115129985e-07, "loss": 1.1118, "step": 23787 }, { "epoch": 0.72, "learning_rate": 9.81121863352017e-07, "loss": 1.0419, "step": 23788 }, { "epoch": 0.72, "learning_rate": 9.809281296500237e-07, "loss": 1.1415, "step": 23789 }, { "epoch": 0.72, "learning_rate": 9.80734410408863e-07, "loss": 1.0787, "step": 23790 }, { "epoch": 0.72, "learning_rate": 9.805407056303792e-07, "loss": 1.1349, "step": 23791 }, { "epoch": 0.72, "learning_rate": 9.80347015316416e-07, "loss": 1.1937, "step": 23792 }, { "epoch": 0.72, "learning_rate": 9.801533394688173e-07, "loss": 1.1207, "step": 23793 }, { "epoch": 0.72, "learning_rate": 9.799596780894276e-07, "loss": 1.0194, "step": 23794 }, { "epoch": 0.72, "learning_rate": 9.797660311800892e-07, "loss": 1.1754, "step": 23795 }, { "epoch": 0.72, "learning_rate": 9.795723987426456e-07, "loss": 1.1268, "step": 23796 }, { "epoch": 0.72, "learning_rate": 9.793787807789406e-07, "loss": 1.1639, "step": 23797 }, { "epoch": 0.72, "learning_rate": 9.791851772908182e-07, "loss": 1.1062, "step": 23798 }, { "epoch": 0.72, "learning_rate": 9.789915882801196e-07, "loss": 1.1361, "step": 23799 }, { "epoch": 0.72, "learning_rate": 9.787980137486886e-07, "loss": 1.0821, "step": 23800 }, { "epoch": 0.72, "learning_rate": 9.786044536983676e-07, "loss": 1.1869, "step": 23801 }, { "epoch": 0.72, "learning_rate": 9.784109081309998e-07, "loss": 1.0593, "step": 23802 }, { "epoch": 0.72, "learning_rate": 9.782173770484279e-07, "loss": 1.0964, "step": 23803 }, { "epoch": 0.72, "learning_rate": 9.78023860452493e-07, "loss": 1.1116, "step": 23804 }, { "epoch": 0.72, "learning_rate": 9.77830358345038e-07, "loss": 1.129, "step": 23805 }, { "epoch": 0.72, "learning_rate": 9.776368707279046e-07, "loss": 1.2009, "step": 23806 }, { "epoch": 0.72, "learning_rate": 9.77443397602936e-07, "loss": 1.1437, "step": 23807 }, { "epoch": 0.72, "learning_rate": 9.772499389719722e-07, "loss": 1.043, "step": 23808 }, { "epoch": 0.72, "learning_rate": 9.770564948368555e-07, "loss": 1.0917, "step": 23809 }, { "epoch": 0.72, "learning_rate": 9.768630651994274e-07, "loss": 1.1315, "step": 23810 }, { "epoch": 0.72, "learning_rate": 9.766696500615305e-07, "loss": 1.0987, "step": 23811 }, { "epoch": 0.72, "learning_rate": 9.764762494250039e-07, "loss": 1.1215, "step": 23812 }, { "epoch": 0.72, "learning_rate": 9.762828632916894e-07, "loss": 1.1405, "step": 23813 }, { "epoch": 0.72, "learning_rate": 9.760894916634283e-07, "loss": 1.1593, "step": 23814 }, { "epoch": 0.72, "learning_rate": 9.758961345420615e-07, "loss": 1.1445, "step": 23815 }, { "epoch": 0.72, "learning_rate": 9.757027919294292e-07, "loss": 1.1339, "step": 23816 }, { "epoch": 0.72, "learning_rate": 9.755094638273724e-07, "loss": 1.0607, "step": 23817 }, { "epoch": 0.72, "learning_rate": 9.75316150237732e-07, "loss": 1.2789, "step": 23818 }, { "epoch": 0.72, "learning_rate": 9.75122851162347e-07, "loss": 1.1679, "step": 23819 }, { "epoch": 0.72, "learning_rate": 9.749295666030579e-07, "loss": 1.2177, "step": 23820 }, { "epoch": 0.72, "learning_rate": 9.747362965617047e-07, "loss": 1.1142, "step": 23821 }, { "epoch": 0.72, "learning_rate": 9.745430410401272e-07, "loss": 1.096, "step": 23822 }, { "epoch": 0.72, "learning_rate": 9.743498000401654e-07, "loss": 1.2077, "step": 23823 }, { "epoch": 0.72, "learning_rate": 9.741565735636598e-07, "loss": 1.1057, "step": 23824 }, { "epoch": 0.72, "learning_rate": 9.739633616124477e-07, "loss": 1.1566, "step": 23825 }, { "epoch": 0.72, "learning_rate": 9.737701641883696e-07, "loss": 1.1545, "step": 23826 }, { "epoch": 0.72, "learning_rate": 9.735769812932641e-07, "loss": 1.0376, "step": 23827 }, { "epoch": 0.72, "learning_rate": 9.733838129289711e-07, "loss": 1.0365, "step": 23828 }, { "epoch": 0.72, "learning_rate": 9.731906590973295e-07, "loss": 1.0284, "step": 23829 }, { "epoch": 0.72, "learning_rate": 9.729975198001764e-07, "loss": 1.0607, "step": 23830 }, { "epoch": 0.72, "learning_rate": 9.72804395039352e-07, "loss": 1.1256, "step": 23831 }, { "epoch": 0.72, "learning_rate": 9.72611284816694e-07, "loss": 1.1748, "step": 23832 }, { "epoch": 0.72, "learning_rate": 9.724181891340417e-07, "loss": 1.0765, "step": 23833 }, { "epoch": 0.72, "learning_rate": 9.722251079932318e-07, "loss": 1.0203, "step": 23834 }, { "epoch": 0.72, "learning_rate": 9.720320413961031e-07, "loss": 1.0692, "step": 23835 }, { "epoch": 0.72, "learning_rate": 9.718389893444934e-07, "loss": 1.066, "step": 23836 }, { "epoch": 0.72, "learning_rate": 9.716459518402415e-07, "loss": 1.1594, "step": 23837 }, { "epoch": 0.72, "learning_rate": 9.714529288851832e-07, "loss": 1.1533, "step": 23838 }, { "epoch": 0.72, "learning_rate": 9.712599204811569e-07, "loss": 1.0523, "step": 23839 }, { "epoch": 0.72, "learning_rate": 9.710669266299996e-07, "loss": 1.0262, "step": 23840 }, { "epoch": 0.72, "learning_rate": 9.708739473335488e-07, "loss": 1.0824, "step": 23841 }, { "epoch": 0.72, "learning_rate": 9.706809825936427e-07, "loss": 1.0878, "step": 23842 }, { "epoch": 0.72, "learning_rate": 9.704880324121161e-07, "loss": 1.2216, "step": 23843 }, { "epoch": 0.72, "learning_rate": 9.702950967908067e-07, "loss": 1.1667, "step": 23844 }, { "epoch": 0.72, "learning_rate": 9.701021757315514e-07, "loss": 1.0847, "step": 23845 }, { "epoch": 0.72, "learning_rate": 9.699092692361867e-07, "loss": 1.1254, "step": 23846 }, { "epoch": 0.72, "learning_rate": 9.697163773065484e-07, "loss": 1.0761, "step": 23847 }, { "epoch": 0.72, "learning_rate": 9.695234999444735e-07, "loss": 1.1628, "step": 23848 }, { "epoch": 0.72, "learning_rate": 9.693306371517977e-07, "loss": 1.0703, "step": 23849 }, { "epoch": 0.72, "learning_rate": 9.69137788930358e-07, "loss": 1.176, "step": 23850 }, { "epoch": 0.72, "learning_rate": 9.689449552819881e-07, "loss": 1.0416, "step": 23851 }, { "epoch": 0.72, "learning_rate": 9.687521362085253e-07, "loss": 1.1237, "step": 23852 }, { "epoch": 0.72, "learning_rate": 9.685593317118044e-07, "loss": 1.1196, "step": 23853 }, { "epoch": 0.72, "learning_rate": 9.683665417936614e-07, "loss": 1.0607, "step": 23854 }, { "epoch": 0.72, "learning_rate": 9.681737664559318e-07, "loss": 1.1573, "step": 23855 }, { "epoch": 0.72, "learning_rate": 9.679810057004494e-07, "loss": 1.1243, "step": 23856 }, { "epoch": 0.72, "learning_rate": 9.6778825952905e-07, "loss": 1.0934, "step": 23857 }, { "epoch": 0.72, "learning_rate": 9.675955279435683e-07, "loss": 1.0911, "step": 23858 }, { "epoch": 0.72, "learning_rate": 9.674028109458403e-07, "loss": 1.2061, "step": 23859 }, { "epoch": 0.72, "learning_rate": 9.67210108537698e-07, "loss": 1.2046, "step": 23860 }, { "epoch": 0.72, "learning_rate": 9.670174207209778e-07, "loss": 1.165, "step": 23861 }, { "epoch": 0.72, "learning_rate": 9.668247474975134e-07, "loss": 1.0321, "step": 23862 }, { "epoch": 0.72, "learning_rate": 9.666320888691396e-07, "loss": 1.106, "step": 23863 }, { "epoch": 0.72, "learning_rate": 9.66439444837689e-07, "loss": 1.2202, "step": 23864 }, { "epoch": 0.72, "learning_rate": 9.662468154049964e-07, "loss": 1.0917, "step": 23865 }, { "epoch": 0.72, "learning_rate": 9.660542005728954e-07, "loss": 1.1539, "step": 23866 }, { "epoch": 0.72, "learning_rate": 9.658616003432198e-07, "loss": 1.2776, "step": 23867 }, { "epoch": 0.72, "learning_rate": 9.656690147178036e-07, "loss": 1.1431, "step": 23868 }, { "epoch": 0.72, "learning_rate": 9.654764436984787e-07, "loss": 1.1946, "step": 23869 }, { "epoch": 0.72, "learning_rate": 9.652838872870787e-07, "loss": 1.0553, "step": 23870 }, { "epoch": 0.72, "learning_rate": 9.65091345485437e-07, "loss": 1.1232, "step": 23871 }, { "epoch": 0.72, "learning_rate": 9.648988182953867e-07, "loss": 0.9994, "step": 23872 }, { "epoch": 0.72, "learning_rate": 9.647063057187603e-07, "loss": 1.1211, "step": 23873 }, { "epoch": 0.72, "learning_rate": 9.645138077573904e-07, "loss": 1.1555, "step": 23874 }, { "epoch": 0.72, "learning_rate": 9.643213244131095e-07, "loss": 1.036, "step": 23875 }, { "epoch": 0.72, "learning_rate": 9.641288556877507e-07, "loss": 1.1652, "step": 23876 }, { "epoch": 0.72, "learning_rate": 9.63936401583145e-07, "loss": 1.0464, "step": 23877 }, { "epoch": 0.72, "learning_rate": 9.637439621011243e-07, "loss": 1.0198, "step": 23878 }, { "epoch": 0.72, "learning_rate": 9.635515372435216e-07, "loss": 1.1317, "step": 23879 }, { "epoch": 0.72, "learning_rate": 9.633591270121683e-07, "loss": 1.1442, "step": 23880 }, { "epoch": 0.72, "learning_rate": 9.631667314088972e-07, "loss": 1.1216, "step": 23881 }, { "epoch": 0.72, "learning_rate": 9.629743504355374e-07, "loss": 1.1048, "step": 23882 }, { "epoch": 0.72, "learning_rate": 9.627819840939218e-07, "loss": 1.0464, "step": 23883 }, { "epoch": 0.72, "learning_rate": 9.62589632385881e-07, "loss": 1.1092, "step": 23884 }, { "epoch": 0.72, "learning_rate": 9.623972953132477e-07, "loss": 1.1306, "step": 23885 }, { "epoch": 0.72, "learning_rate": 9.622049728778505e-07, "loss": 1.1881, "step": 23886 }, { "epoch": 0.72, "learning_rate": 9.620126650815212e-07, "loss": 1.115, "step": 23887 }, { "epoch": 0.72, "learning_rate": 9.618203719260907e-07, "loss": 0.9645, "step": 23888 }, { "epoch": 0.72, "learning_rate": 9.616280934133906e-07, "loss": 1.1031, "step": 23889 }, { "epoch": 0.72, "learning_rate": 9.614358295452492e-07, "loss": 1.0917, "step": 23890 }, { "epoch": 0.72, "learning_rate": 9.612435803234972e-07, "loss": 1.1267, "step": 23891 }, { "epoch": 0.72, "learning_rate": 9.61051345749966e-07, "loss": 1.131, "step": 23892 }, { "epoch": 0.72, "learning_rate": 9.608591258264844e-07, "loss": 1.1497, "step": 23893 }, { "epoch": 0.72, "learning_rate": 9.606669205548835e-07, "loss": 1.0727, "step": 23894 }, { "epoch": 0.72, "learning_rate": 9.604747299369913e-07, "loss": 1.0363, "step": 23895 }, { "epoch": 0.72, "learning_rate": 9.602825539746383e-07, "loss": 1.0604, "step": 23896 }, { "epoch": 0.72, "learning_rate": 9.600903926696537e-07, "loss": 1.0261, "step": 23897 }, { "epoch": 0.72, "learning_rate": 9.598982460238667e-07, "loss": 1.0427, "step": 23898 }, { "epoch": 0.72, "learning_rate": 9.59706114039107e-07, "loss": 1.1592, "step": 23899 }, { "epoch": 0.72, "learning_rate": 9.595139967172042e-07, "loss": 1.1979, "step": 23900 }, { "epoch": 0.72, "learning_rate": 9.593218940599853e-07, "loss": 1.0121, "step": 23901 }, { "epoch": 0.72, "learning_rate": 9.591298060692796e-07, "loss": 1.1774, "step": 23902 }, { "epoch": 0.72, "learning_rate": 9.589377327469165e-07, "loss": 1.1171, "step": 23903 }, { "epoch": 0.72, "learning_rate": 9.587456740947238e-07, "loss": 1.1619, "step": 23904 }, { "epoch": 0.72, "learning_rate": 9.5855363011453e-07, "loss": 1.0967, "step": 23905 }, { "epoch": 0.72, "learning_rate": 9.583616008081641e-07, "loss": 1.2237, "step": 23906 }, { "epoch": 0.72, "learning_rate": 9.581695861774523e-07, "loss": 1.0556, "step": 23907 }, { "epoch": 0.72, "learning_rate": 9.579775862242238e-07, "loss": 1.0763, "step": 23908 }, { "epoch": 0.72, "learning_rate": 9.577856009503056e-07, "loss": 1.0258, "step": 23909 }, { "epoch": 0.72, "learning_rate": 9.575936303575262e-07, "loss": 1.0667, "step": 23910 }, { "epoch": 0.72, "learning_rate": 9.574016744477129e-07, "loss": 1.1476, "step": 23911 }, { "epoch": 0.72, "learning_rate": 9.572097332226923e-07, "loss": 1.1307, "step": 23912 }, { "epoch": 0.72, "learning_rate": 9.57017806684292e-07, "loss": 1.2097, "step": 23913 }, { "epoch": 0.72, "learning_rate": 9.568258948343387e-07, "loss": 1.1494, "step": 23914 }, { "epoch": 0.72, "learning_rate": 9.566339976746607e-07, "loss": 1.0492, "step": 23915 }, { "epoch": 0.72, "learning_rate": 9.564421152070829e-07, "loss": 0.9939, "step": 23916 }, { "epoch": 0.72, "learning_rate": 9.562502474334328e-07, "loss": 1.2317, "step": 23917 }, { "epoch": 0.72, "learning_rate": 9.560583943555369e-07, "loss": 1.1129, "step": 23918 }, { "epoch": 0.72, "learning_rate": 9.558665559752222e-07, "loss": 1.1301, "step": 23919 }, { "epoch": 0.72, "learning_rate": 9.556747322943133e-07, "loss": 1.1495, "step": 23920 }, { "epoch": 0.72, "learning_rate": 9.554829233146374e-07, "loss": 1.0057, "step": 23921 }, { "epoch": 0.72, "learning_rate": 9.552911290380202e-07, "loss": 1.067, "step": 23922 }, { "epoch": 0.72, "learning_rate": 9.550993494662872e-07, "loss": 1.1074, "step": 23923 }, { "epoch": 0.72, "learning_rate": 9.549075846012654e-07, "loss": 1.0966, "step": 23924 }, { "epoch": 0.72, "learning_rate": 9.547158344447785e-07, "loss": 1.0963, "step": 23925 }, { "epoch": 0.72, "learning_rate": 9.545240989986524e-07, "loss": 1.1088, "step": 23926 }, { "epoch": 0.72, "learning_rate": 9.543323782647127e-07, "loss": 1.1437, "step": 23927 }, { "epoch": 0.72, "learning_rate": 9.541406722447843e-07, "loss": 1.032, "step": 23928 }, { "epoch": 0.72, "learning_rate": 9.53948980940692e-07, "loss": 1.1111, "step": 23929 }, { "epoch": 0.72, "learning_rate": 9.537573043542612e-07, "loss": 1.0997, "step": 23930 }, { "epoch": 0.72, "learning_rate": 9.53565642487316e-07, "loss": 1.084, "step": 23931 }, { "epoch": 0.72, "learning_rate": 9.533739953416818e-07, "loss": 1.0665, "step": 23932 }, { "epoch": 0.72, "learning_rate": 9.531823629191816e-07, "loss": 1.162, "step": 23933 }, { "epoch": 0.72, "learning_rate": 9.529907452216403e-07, "loss": 1.084, "step": 23934 }, { "epoch": 0.72, "learning_rate": 9.52799142250882e-07, "loss": 0.9495, "step": 23935 }, { "epoch": 0.72, "learning_rate": 9.526075540087307e-07, "loss": 1.2548, "step": 23936 }, { "epoch": 0.72, "learning_rate": 9.524159804970109e-07, "loss": 1.1524, "step": 23937 }, { "epoch": 0.72, "learning_rate": 9.522244217175449e-07, "loss": 1.1098, "step": 23938 }, { "epoch": 0.72, "learning_rate": 9.520328776721572e-07, "loss": 1.0559, "step": 23939 }, { "epoch": 0.72, "learning_rate": 9.518413483626709e-07, "loss": 1.0495, "step": 23940 }, { "epoch": 0.72, "learning_rate": 9.5164983379091e-07, "loss": 1.0886, "step": 23941 }, { "epoch": 0.72, "learning_rate": 9.514583339586963e-07, "loss": 1.1843, "step": 23942 }, { "epoch": 0.72, "learning_rate": 9.512668488678534e-07, "loss": 1.0851, "step": 23943 }, { "epoch": 0.72, "learning_rate": 9.510753785202043e-07, "loss": 1.0381, "step": 23944 }, { "epoch": 0.72, "learning_rate": 9.508839229175724e-07, "loss": 1.0623, "step": 23945 }, { "epoch": 0.72, "learning_rate": 9.506924820617786e-07, "loss": 1.0067, "step": 23946 }, { "epoch": 0.72, "learning_rate": 9.50501055954646e-07, "loss": 1.193, "step": 23947 }, { "epoch": 0.72, "learning_rate": 9.503096445979973e-07, "loss": 1.0692, "step": 23948 }, { "epoch": 0.72, "learning_rate": 9.501182479936544e-07, "loss": 1.1329, "step": 23949 }, { "epoch": 0.72, "learning_rate": 9.499268661434402e-07, "loss": 1.1351, "step": 23950 }, { "epoch": 0.72, "learning_rate": 9.497354990491747e-07, "loss": 1.091, "step": 23951 }, { "epoch": 0.72, "learning_rate": 9.495441467126806e-07, "loss": 1.1376, "step": 23952 }, { "epoch": 0.72, "learning_rate": 9.493528091357798e-07, "loss": 1.1678, "step": 23953 }, { "epoch": 0.72, "learning_rate": 9.491614863202933e-07, "loss": 1.1826, "step": 23954 }, { "epoch": 0.72, "learning_rate": 9.489701782680425e-07, "loss": 1.11, "step": 23955 }, { "epoch": 0.72, "learning_rate": 9.487788849808486e-07, "loss": 1.1581, "step": 23956 }, { "epoch": 0.72, "learning_rate": 9.485876064605326e-07, "loss": 1.0583, "step": 23957 }, { "epoch": 0.72, "learning_rate": 9.483963427089162e-07, "loss": 1.1206, "step": 23958 }, { "epoch": 0.72, "learning_rate": 9.482050937278187e-07, "loss": 1.0605, "step": 23959 }, { "epoch": 0.72, "learning_rate": 9.480138595190611e-07, "loss": 1.1865, "step": 23960 }, { "epoch": 0.72, "learning_rate": 9.478226400844642e-07, "loss": 1.0717, "step": 23961 }, { "epoch": 0.72, "learning_rate": 9.476314354258481e-07, "loss": 0.9777, "step": 23962 }, { "epoch": 0.72, "learning_rate": 9.47440245545034e-07, "loss": 1.1663, "step": 23963 }, { "epoch": 0.72, "learning_rate": 9.472490704438403e-07, "loss": 1.0408, "step": 23964 }, { "epoch": 0.72, "learning_rate": 9.470579101240876e-07, "loss": 1.0328, "step": 23965 }, { "epoch": 0.72, "learning_rate": 9.468667645875957e-07, "loss": 1.1213, "step": 23966 }, { "epoch": 0.72, "learning_rate": 9.466756338361849e-07, "loss": 1.1242, "step": 23967 }, { "epoch": 0.72, "learning_rate": 9.46484517871673e-07, "loss": 1.1331, "step": 23968 }, { "epoch": 0.72, "learning_rate": 9.462934166958806e-07, "loss": 1.0668, "step": 23969 }, { "epoch": 0.72, "learning_rate": 9.461023303106265e-07, "loss": 1.2331, "step": 23970 }, { "epoch": 0.72, "learning_rate": 9.459112587177305e-07, "loss": 1.0651, "step": 23971 }, { "epoch": 0.72, "learning_rate": 9.457202019190101e-07, "loss": 1.0629, "step": 23972 }, { "epoch": 0.72, "learning_rate": 9.45529159916285e-07, "loss": 1.0604, "step": 23973 }, { "epoch": 0.72, "learning_rate": 9.453381327113733e-07, "loss": 1.0289, "step": 23974 }, { "epoch": 0.72, "learning_rate": 9.451471203060941e-07, "loss": 1.0992, "step": 23975 }, { "epoch": 0.72, "learning_rate": 9.449561227022664e-07, "loss": 1.118, "step": 23976 }, { "epoch": 0.72, "learning_rate": 9.447651399017063e-07, "loss": 1.0693, "step": 23977 }, { "epoch": 0.72, "learning_rate": 9.445741719062332e-07, "loss": 1.2012, "step": 23978 }, { "epoch": 0.72, "learning_rate": 9.443832187176647e-07, "loss": 1.11, "step": 23979 }, { "epoch": 0.72, "learning_rate": 9.441922803378189e-07, "loss": 1.11, "step": 23980 }, { "epoch": 0.72, "learning_rate": 9.440013567685132e-07, "loss": 1.0829, "step": 23981 }, { "epoch": 0.72, "learning_rate": 9.438104480115662e-07, "loss": 1.1224, "step": 23982 }, { "epoch": 0.72, "learning_rate": 9.436195540687934e-07, "loss": 0.9775, "step": 23983 }, { "epoch": 0.72, "learning_rate": 9.434286749420126e-07, "loss": 0.9801, "step": 23984 }, { "epoch": 0.72, "learning_rate": 9.432378106330415e-07, "loss": 1.1703, "step": 23985 }, { "epoch": 0.72, "learning_rate": 9.430469611436965e-07, "loss": 1.1444, "step": 23986 }, { "epoch": 0.72, "learning_rate": 9.428561264757946e-07, "loss": 1.183, "step": 23987 }, { "epoch": 0.72, "learning_rate": 9.426653066311522e-07, "loss": 1.0477, "step": 23988 }, { "epoch": 0.72, "learning_rate": 9.424745016115871e-07, "loss": 1.1205, "step": 23989 }, { "epoch": 0.72, "learning_rate": 9.42283711418914e-07, "loss": 1.0231, "step": 23990 }, { "epoch": 0.72, "learning_rate": 9.420929360549494e-07, "loss": 1.0942, "step": 23991 }, { "epoch": 0.72, "learning_rate": 9.419021755215099e-07, "loss": 1.1479, "step": 23992 }, { "epoch": 0.72, "learning_rate": 9.417114298204122e-07, "loss": 1.0361, "step": 23993 }, { "epoch": 0.72, "learning_rate": 9.415206989534701e-07, "loss": 1.1526, "step": 23994 }, { "epoch": 0.72, "learning_rate": 9.413299829225003e-07, "loss": 1.0489, "step": 23995 }, { "epoch": 0.72, "learning_rate": 9.411392817293188e-07, "loss": 1.1144, "step": 23996 }, { "epoch": 0.72, "learning_rate": 9.409485953757411e-07, "loss": 1.1225, "step": 23997 }, { "epoch": 0.72, "learning_rate": 9.407579238635811e-07, "loss": 1.1457, "step": 23998 }, { "epoch": 0.72, "learning_rate": 9.405672671946547e-07, "loss": 1.158, "step": 23999 }, { "epoch": 0.72, "learning_rate": 9.403766253707769e-07, "loss": 1.0867, "step": 24000 }, { "epoch": 0.72, "learning_rate": 9.401859983937625e-07, "loss": 1.0768, "step": 24001 }, { "epoch": 0.72, "learning_rate": 9.399953862654271e-07, "loss": 1.1613, "step": 24002 }, { "epoch": 0.72, "learning_rate": 9.398047889875833e-07, "loss": 1.0943, "step": 24003 }, { "epoch": 0.72, "learning_rate": 9.396142065620467e-07, "loss": 1.1418, "step": 24004 }, { "epoch": 0.72, "learning_rate": 9.394236389906311e-07, "loss": 1.0984, "step": 24005 }, { "epoch": 0.72, "learning_rate": 9.392330862751517e-07, "loss": 1.0609, "step": 24006 }, { "epoch": 0.72, "learning_rate": 9.390425484174209e-07, "loss": 1.0391, "step": 24007 }, { "epoch": 0.72, "learning_rate": 9.388520254192532e-07, "loss": 1.0977, "step": 24008 }, { "epoch": 0.72, "learning_rate": 9.386615172824626e-07, "loss": 1.1066, "step": 24009 }, { "epoch": 0.72, "learning_rate": 9.384710240088621e-07, "loss": 1.2231, "step": 24010 }, { "epoch": 0.72, "learning_rate": 9.382805456002656e-07, "loss": 0.9826, "step": 24011 }, { "epoch": 0.72, "learning_rate": 9.380900820584859e-07, "loss": 1.2366, "step": 24012 }, { "epoch": 0.72, "learning_rate": 9.378996333853362e-07, "loss": 1.1273, "step": 24013 }, { "epoch": 0.72, "learning_rate": 9.377091995826301e-07, "loss": 1.043, "step": 24014 }, { "epoch": 0.72, "learning_rate": 9.375187806521807e-07, "loss": 1.0423, "step": 24015 }, { "epoch": 0.72, "learning_rate": 9.373283765957991e-07, "loss": 1.0191, "step": 24016 }, { "epoch": 0.72, "learning_rate": 9.371379874152989e-07, "loss": 1.11, "step": 24017 }, { "epoch": 0.72, "learning_rate": 9.369476131124921e-07, "loss": 1.0978, "step": 24018 }, { "epoch": 0.72, "learning_rate": 9.367572536891922e-07, "loss": 1.2517, "step": 24019 }, { "epoch": 0.72, "learning_rate": 9.365669091472097e-07, "loss": 1.1354, "step": 24020 }, { "epoch": 0.72, "learning_rate": 9.36376579488357e-07, "loss": 1.0607, "step": 24021 }, { "epoch": 0.72, "learning_rate": 9.361862647144462e-07, "loss": 1.138, "step": 24022 }, { "epoch": 0.72, "learning_rate": 9.359959648272901e-07, "loss": 1.2424, "step": 24023 }, { "epoch": 0.72, "learning_rate": 9.358056798286982e-07, "loss": 1.0884, "step": 24024 }, { "epoch": 0.72, "learning_rate": 9.356154097204828e-07, "loss": 1.1171, "step": 24025 }, { "epoch": 0.72, "learning_rate": 9.354251545044554e-07, "loss": 1.0686, "step": 24026 }, { "epoch": 0.72, "learning_rate": 9.352349141824268e-07, "loss": 1.0282, "step": 24027 }, { "epoch": 0.72, "learning_rate": 9.350446887562093e-07, "loss": 1.0237, "step": 24028 }, { "epoch": 0.72, "learning_rate": 9.348544782276115e-07, "loss": 1.1126, "step": 24029 }, { "epoch": 0.72, "learning_rate": 9.346642825984453e-07, "loss": 1.0557, "step": 24030 }, { "epoch": 0.72, "learning_rate": 9.344741018705214e-07, "loss": 1.1635, "step": 24031 }, { "epoch": 0.72, "learning_rate": 9.34283936045651e-07, "loss": 1.1729, "step": 24032 }, { "epoch": 0.72, "learning_rate": 9.340937851256424e-07, "loss": 1.1623, "step": 24033 }, { "epoch": 0.72, "learning_rate": 9.339036491123069e-07, "loss": 1.0178, "step": 24034 }, { "epoch": 0.72, "learning_rate": 9.337135280074544e-07, "loss": 1.0614, "step": 24035 }, { "epoch": 0.72, "learning_rate": 9.335234218128946e-07, "loss": 1.1103, "step": 24036 }, { "epoch": 0.72, "learning_rate": 9.333333305304377e-07, "loss": 1.158, "step": 24037 }, { "epoch": 0.72, "learning_rate": 9.331432541618929e-07, "loss": 1.0443, "step": 24038 }, { "epoch": 0.72, "learning_rate": 9.329531927090696e-07, "loss": 0.9999, "step": 24039 }, { "epoch": 0.72, "learning_rate": 9.327631461737771e-07, "loss": 1.022, "step": 24040 }, { "epoch": 0.72, "learning_rate": 9.325731145578257e-07, "loss": 1.0453, "step": 24041 }, { "epoch": 0.72, "learning_rate": 9.323830978630221e-07, "loss": 1.1378, "step": 24042 }, { "epoch": 0.72, "learning_rate": 9.321930960911768e-07, "loss": 1.0821, "step": 24043 }, { "epoch": 0.72, "learning_rate": 9.320031092440981e-07, "loss": 1.0894, "step": 24044 }, { "epoch": 0.72, "learning_rate": 9.318131373235953e-07, "loss": 1.1423, "step": 24045 }, { "epoch": 0.72, "learning_rate": 9.316231803314755e-07, "loss": 1.1129, "step": 24046 }, { "epoch": 0.72, "learning_rate": 9.314332382695477e-07, "loss": 1.0684, "step": 24047 }, { "epoch": 0.72, "learning_rate": 9.312433111396199e-07, "loss": 1.1064, "step": 24048 }, { "epoch": 0.72, "learning_rate": 9.310533989435011e-07, "loss": 1.1175, "step": 24049 }, { "epoch": 0.72, "learning_rate": 9.308635016829975e-07, "loss": 1.1097, "step": 24050 }, { "epoch": 0.72, "learning_rate": 9.306736193599175e-07, "loss": 1.0576, "step": 24051 }, { "epoch": 0.72, "learning_rate": 9.304837519760689e-07, "loss": 1.001, "step": 24052 }, { "epoch": 0.72, "learning_rate": 9.302938995332591e-07, "loss": 1.1277, "step": 24053 }, { "epoch": 0.72, "learning_rate": 9.301040620332962e-07, "loss": 1.0656, "step": 24054 }, { "epoch": 0.72, "learning_rate": 9.299142394779858e-07, "loss": 1.1548, "step": 24055 }, { "epoch": 0.72, "learning_rate": 9.297244318691356e-07, "loss": 1.1344, "step": 24056 }, { "epoch": 0.72, "learning_rate": 9.295346392085528e-07, "loss": 1.1819, "step": 24057 }, { "epoch": 0.72, "learning_rate": 9.293448614980444e-07, "loss": 1.108, "step": 24058 }, { "epoch": 0.72, "learning_rate": 9.291550987394157e-07, "loss": 1.1296, "step": 24059 }, { "epoch": 0.72, "learning_rate": 9.289653509344738e-07, "loss": 1.0663, "step": 24060 }, { "epoch": 0.72, "learning_rate": 9.287756180850252e-07, "loss": 1.0352, "step": 24061 }, { "epoch": 0.72, "learning_rate": 9.28585900192876e-07, "loss": 1.0631, "step": 24062 }, { "epoch": 0.72, "learning_rate": 9.283961972598321e-07, "loss": 1.1508, "step": 24063 }, { "epoch": 0.72, "learning_rate": 9.282065092876996e-07, "loss": 1.201, "step": 24064 }, { "epoch": 0.72, "learning_rate": 9.280168362782852e-07, "loss": 1.088, "step": 24065 }, { "epoch": 0.72, "learning_rate": 9.278271782333923e-07, "loss": 1.0608, "step": 24066 }, { "epoch": 0.73, "learning_rate": 9.276375351548275e-07, "loss": 1.0642, "step": 24067 }, { "epoch": 0.73, "learning_rate": 9.274479070443962e-07, "loss": 0.9308, "step": 24068 }, { "epoch": 0.73, "learning_rate": 9.272582939039035e-07, "loss": 1.1486, "step": 24069 }, { "epoch": 0.73, "learning_rate": 9.270686957351541e-07, "loss": 1.095, "step": 24070 }, { "epoch": 0.73, "learning_rate": 9.268791125399543e-07, "loss": 1.2545, "step": 24071 }, { "epoch": 0.73, "learning_rate": 9.266895443201066e-07, "loss": 1.0978, "step": 24072 }, { "epoch": 0.73, "learning_rate": 9.264999910774169e-07, "loss": 1.1293, "step": 24073 }, { "epoch": 0.73, "learning_rate": 9.263104528136893e-07, "loss": 1.1786, "step": 24074 }, { "epoch": 0.73, "learning_rate": 9.261209295307294e-07, "loss": 1.0774, "step": 24075 }, { "epoch": 0.73, "learning_rate": 9.259314212303391e-07, "loss": 1.1318, "step": 24076 }, { "epoch": 0.73, "learning_rate": 9.257419279143237e-07, "loss": 1.053, "step": 24077 }, { "epoch": 0.73, "learning_rate": 9.25552449584487e-07, "loss": 1.0355, "step": 24078 }, { "epoch": 0.73, "learning_rate": 9.253629862426327e-07, "loss": 1.1369, "step": 24079 }, { "epoch": 0.73, "learning_rate": 9.251735378905652e-07, "loss": 1.1718, "step": 24080 }, { "epoch": 0.73, "learning_rate": 9.249841045300864e-07, "loss": 1.1504, "step": 24081 }, { "epoch": 0.73, "learning_rate": 9.247946861630003e-07, "loss": 1.1039, "step": 24082 }, { "epoch": 0.73, "learning_rate": 9.2460528279111e-07, "loss": 1.0939, "step": 24083 }, { "epoch": 0.73, "learning_rate": 9.244158944162199e-07, "loss": 1.1327, "step": 24084 }, { "epoch": 0.73, "learning_rate": 9.242265210401305e-07, "loss": 1.099, "step": 24085 }, { "epoch": 0.73, "learning_rate": 9.240371626646458e-07, "loss": 1.2062, "step": 24086 }, { "epoch": 0.73, "learning_rate": 9.238478192915681e-07, "loss": 1.0546, "step": 24087 }, { "epoch": 0.73, "learning_rate": 9.236584909227012e-07, "loss": 1.2056, "step": 24088 }, { "epoch": 0.73, "learning_rate": 9.234691775598453e-07, "loss": 1.0274, "step": 24089 }, { "epoch": 0.73, "learning_rate": 9.232798792048034e-07, "loss": 1.1859, "step": 24090 }, { "epoch": 0.73, "learning_rate": 9.23090595859378e-07, "loss": 1.1199, "step": 24091 }, { "epoch": 0.73, "learning_rate": 9.229013275253704e-07, "loss": 1.1724, "step": 24092 }, { "epoch": 0.73, "learning_rate": 9.227120742045828e-07, "loss": 1.0851, "step": 24093 }, { "epoch": 0.73, "learning_rate": 9.225228358988164e-07, "loss": 1.1035, "step": 24094 }, { "epoch": 0.73, "learning_rate": 9.223336126098728e-07, "loss": 0.967, "step": 24095 }, { "epoch": 0.73, "learning_rate": 9.221444043395536e-07, "loss": 1.0883, "step": 24096 }, { "epoch": 0.73, "learning_rate": 9.219552110896606e-07, "loss": 1.2108, "step": 24097 }, { "epoch": 0.73, "learning_rate": 9.217660328619932e-07, "loss": 1.1948, "step": 24098 }, { "epoch": 0.73, "learning_rate": 9.215768696583527e-07, "loss": 1.0504, "step": 24099 }, { "epoch": 0.73, "learning_rate": 9.213877214805405e-07, "loss": 1.1074, "step": 24100 }, { "epoch": 0.73, "learning_rate": 9.211985883303578e-07, "loss": 1.0661, "step": 24101 }, { "epoch": 0.73, "learning_rate": 9.210094702096032e-07, "loss": 1.0607, "step": 24102 }, { "epoch": 0.73, "learning_rate": 9.20820367120078e-07, "loss": 1.0638, "step": 24103 }, { "epoch": 0.73, "learning_rate": 9.206312790635821e-07, "loss": 1.0786, "step": 24104 }, { "epoch": 0.73, "learning_rate": 9.204422060419168e-07, "loss": 1.1373, "step": 24105 }, { "epoch": 0.73, "learning_rate": 9.202531480568803e-07, "loss": 1.2493, "step": 24106 }, { "epoch": 0.73, "learning_rate": 9.200641051102729e-07, "loss": 1.01, "step": 24107 }, { "epoch": 0.73, "learning_rate": 9.198750772038942e-07, "loss": 1.0703, "step": 24108 }, { "epoch": 0.73, "learning_rate": 9.196860643395439e-07, "loss": 0.9136, "step": 24109 }, { "epoch": 0.73, "learning_rate": 9.19497066519022e-07, "loss": 1.1085, "step": 24110 }, { "epoch": 0.73, "learning_rate": 9.193080837441257e-07, "loss": 1.1405, "step": 24111 }, { "epoch": 0.73, "learning_rate": 9.191191160166554e-07, "loss": 1.1989, "step": 24112 }, { "epoch": 0.73, "learning_rate": 9.189301633384096e-07, "loss": 1.1187, "step": 24113 }, { "epoch": 0.73, "learning_rate": 9.187412257111883e-07, "loss": 1.0716, "step": 24114 }, { "epoch": 0.73, "learning_rate": 9.18552303136788e-07, "loss": 1.1333, "step": 24115 }, { "epoch": 0.73, "learning_rate": 9.18363395617008e-07, "loss": 1.0342, "step": 24116 }, { "epoch": 0.73, "learning_rate": 9.181745031536466e-07, "loss": 1.0963, "step": 24117 }, { "epoch": 0.73, "learning_rate": 9.179856257485024e-07, "loss": 1.1434, "step": 24118 }, { "epoch": 0.73, "learning_rate": 9.17796763403373e-07, "loss": 1.0125, "step": 24119 }, { "epoch": 0.73, "learning_rate": 9.176079161200563e-07, "loss": 1.2035, "step": 24120 }, { "epoch": 0.73, "learning_rate": 9.174190839003503e-07, "loss": 1.161, "step": 24121 }, { "epoch": 0.73, "learning_rate": 9.172302667460523e-07, "loss": 1.1268, "step": 24122 }, { "epoch": 0.73, "learning_rate": 9.170414646589606e-07, "loss": 1.1428, "step": 24123 }, { "epoch": 0.73, "learning_rate": 9.168526776408712e-07, "loss": 1.1061, "step": 24124 }, { "epoch": 0.73, "learning_rate": 9.166639056935819e-07, "loss": 1.0115, "step": 24125 }, { "epoch": 0.73, "learning_rate": 9.164751488188894e-07, "loss": 1.0906, "step": 24126 }, { "epoch": 0.73, "learning_rate": 9.162864070185917e-07, "loss": 1.0989, "step": 24127 }, { "epoch": 0.73, "learning_rate": 9.160976802944841e-07, "loss": 1.0367, "step": 24128 }, { "epoch": 0.73, "learning_rate": 9.159089686483635e-07, "loss": 1.0957, "step": 24129 }, { "epoch": 0.73, "learning_rate": 9.157202720820266e-07, "loss": 1.1472, "step": 24130 }, { "epoch": 0.73, "learning_rate": 9.155315905972706e-07, "loss": 1.0864, "step": 24131 }, { "epoch": 0.73, "learning_rate": 9.1534292419589e-07, "loss": 1.1685, "step": 24132 }, { "epoch": 0.73, "learning_rate": 9.151542728796814e-07, "loss": 1.1127, "step": 24133 }, { "epoch": 0.73, "learning_rate": 9.149656366504408e-07, "loss": 0.9428, "step": 24134 }, { "epoch": 0.73, "learning_rate": 9.147770155099639e-07, "loss": 1.082, "step": 24135 }, { "epoch": 0.73, "learning_rate": 9.145884094600474e-07, "loss": 1.1337, "step": 24136 }, { "epoch": 0.73, "learning_rate": 9.143998185024849e-07, "loss": 1.0848, "step": 24137 }, { "epoch": 0.73, "learning_rate": 9.142112426390723e-07, "loss": 1.1032, "step": 24138 }, { "epoch": 0.73, "learning_rate": 9.14022681871605e-07, "loss": 1.1108, "step": 24139 }, { "epoch": 0.73, "learning_rate": 9.138341362018788e-07, "loss": 1.1367, "step": 24140 }, { "epoch": 0.73, "learning_rate": 9.136456056316866e-07, "loss": 1.1199, "step": 24141 }, { "epoch": 0.73, "learning_rate": 9.134570901628245e-07, "loss": 1.0234, "step": 24142 }, { "epoch": 0.73, "learning_rate": 9.132685897970867e-07, "loss": 1.1313, "step": 24143 }, { "epoch": 0.73, "learning_rate": 9.130801045362678e-07, "loss": 1.0309, "step": 24144 }, { "epoch": 0.73, "learning_rate": 9.12891634382162e-07, "loss": 1.1317, "step": 24145 }, { "epoch": 0.73, "learning_rate": 9.127031793365634e-07, "loss": 1.1693, "step": 24146 }, { "epoch": 0.73, "learning_rate": 9.125147394012671e-07, "loss": 1.0927, "step": 24147 }, { "epoch": 0.73, "learning_rate": 9.123263145780647e-07, "loss": 1.0436, "step": 24148 }, { "epoch": 0.73, "learning_rate": 9.121379048687515e-07, "loss": 1.2793, "step": 24149 }, { "epoch": 0.73, "learning_rate": 9.119495102751206e-07, "loss": 1.2409, "step": 24150 }, { "epoch": 0.73, "learning_rate": 9.117611307989654e-07, "loss": 1.0852, "step": 24151 }, { "epoch": 0.73, "learning_rate": 9.115727664420793e-07, "loss": 1.1877, "step": 24152 }, { "epoch": 0.73, "learning_rate": 9.113844172062566e-07, "loss": 1.0869, "step": 24153 }, { "epoch": 0.73, "learning_rate": 9.111960830932881e-07, "loss": 1.053, "step": 24154 }, { "epoch": 0.73, "learning_rate": 9.110077641049675e-07, "loss": 1.0769, "step": 24155 }, { "epoch": 0.73, "learning_rate": 9.108194602430881e-07, "loss": 1.1242, "step": 24156 }, { "epoch": 0.73, "learning_rate": 9.106311715094427e-07, "loss": 1.1646, "step": 24157 }, { "epoch": 0.73, "learning_rate": 9.104428979058222e-07, "loss": 1.0717, "step": 24158 }, { "epoch": 0.73, "learning_rate": 9.102546394340198e-07, "loss": 1.1141, "step": 24159 }, { "epoch": 0.73, "learning_rate": 9.100663960958275e-07, "loss": 1.0134, "step": 24160 }, { "epoch": 0.73, "learning_rate": 9.098781678930374e-07, "loss": 1.1727, "step": 24161 }, { "epoch": 0.73, "learning_rate": 9.096899548274424e-07, "loss": 1.1561, "step": 24162 }, { "epoch": 0.73, "learning_rate": 9.095017569008319e-07, "loss": 1.0278, "step": 24163 }, { "epoch": 0.73, "learning_rate": 9.093135741149988e-07, "loss": 1.0965, "step": 24164 }, { "epoch": 0.73, "learning_rate": 9.091254064717345e-07, "loss": 1.1305, "step": 24165 }, { "epoch": 0.73, "learning_rate": 9.089372539728308e-07, "loss": 1.1649, "step": 24166 }, { "epoch": 0.73, "learning_rate": 9.087491166200774e-07, "loss": 1.0907, "step": 24167 }, { "epoch": 0.73, "learning_rate": 9.085609944152662e-07, "loss": 1.2262, "step": 24168 }, { "epoch": 0.73, "learning_rate": 9.083728873601877e-07, "loss": 1.096, "step": 24169 }, { "epoch": 0.73, "learning_rate": 9.081847954566336e-07, "loss": 1.0225, "step": 24170 }, { "epoch": 0.73, "learning_rate": 9.079967187063929e-07, "loss": 1.1055, "step": 24171 }, { "epoch": 0.73, "learning_rate": 9.078086571112566e-07, "loss": 0.9995, "step": 24172 }, { "epoch": 0.73, "learning_rate": 9.076206106730148e-07, "loss": 1.0865, "step": 24173 }, { "epoch": 0.73, "learning_rate": 9.074325793934582e-07, "loss": 1.0618, "step": 24174 }, { "epoch": 0.73, "learning_rate": 9.072445632743763e-07, "loss": 1.0905, "step": 24175 }, { "epoch": 0.73, "learning_rate": 9.070565623175593e-07, "loss": 1.0667, "step": 24176 }, { "epoch": 0.73, "learning_rate": 9.068685765247962e-07, "loss": 1.1091, "step": 24177 }, { "epoch": 0.73, "learning_rate": 9.066806058978773e-07, "loss": 1.0767, "step": 24178 }, { "epoch": 0.73, "learning_rate": 9.064926504385923e-07, "loss": 1.1825, "step": 24179 }, { "epoch": 0.73, "learning_rate": 9.063047101487293e-07, "loss": 1.1497, "step": 24180 }, { "epoch": 0.73, "learning_rate": 9.061167850300775e-07, "loss": 1.1179, "step": 24181 }, { "epoch": 0.73, "learning_rate": 9.059288750844266e-07, "loss": 1.1013, "step": 24182 }, { "epoch": 0.73, "learning_rate": 9.057409803135658e-07, "loss": 1.0962, "step": 24183 }, { "epoch": 0.73, "learning_rate": 9.055531007192822e-07, "loss": 1.1105, "step": 24184 }, { "epoch": 0.73, "learning_rate": 9.053652363033652e-07, "loss": 1.0858, "step": 24185 }, { "epoch": 0.73, "learning_rate": 9.051773870676031e-07, "loss": 1.0844, "step": 24186 }, { "epoch": 0.73, "learning_rate": 9.049895530137842e-07, "loss": 1.0546, "step": 24187 }, { "epoch": 0.73, "learning_rate": 9.048017341436974e-07, "loss": 1.2038, "step": 24188 }, { "epoch": 0.73, "learning_rate": 9.046139304591289e-07, "loss": 1.2371, "step": 24189 }, { "epoch": 0.73, "learning_rate": 9.044261419618675e-07, "loss": 1.062, "step": 24190 }, { "epoch": 0.73, "learning_rate": 9.042383686537007e-07, "loss": 1.1705, "step": 24191 }, { "epoch": 0.73, "learning_rate": 9.040506105364172e-07, "loss": 1.0554, "step": 24192 }, { "epoch": 0.73, "learning_rate": 9.038628676118022e-07, "loss": 1.0785, "step": 24193 }, { "epoch": 0.73, "learning_rate": 9.036751398816437e-07, "loss": 1.2123, "step": 24194 }, { "epoch": 0.73, "learning_rate": 9.034874273477295e-07, "loss": 1.0743, "step": 24195 }, { "epoch": 0.73, "learning_rate": 9.032997300118468e-07, "loss": 1.0964, "step": 24196 }, { "epoch": 0.73, "learning_rate": 9.031120478757807e-07, "loss": 1.0764, "step": 24197 }, { "epoch": 0.73, "learning_rate": 9.02924380941319e-07, "loss": 1.0477, "step": 24198 }, { "epoch": 0.73, "learning_rate": 9.027367292102479e-07, "loss": 1.0622, "step": 24199 }, { "epoch": 0.73, "learning_rate": 9.025490926843538e-07, "loss": 0.9748, "step": 24200 }, { "epoch": 0.73, "learning_rate": 9.023614713654233e-07, "loss": 1.2002, "step": 24201 }, { "epoch": 0.73, "learning_rate": 9.021738652552417e-07, "loss": 1.099, "step": 24202 }, { "epoch": 0.73, "learning_rate": 9.019862743555957e-07, "loss": 1.1049, "step": 24203 }, { "epoch": 0.73, "learning_rate": 9.017986986682706e-07, "loss": 1.0891, "step": 24204 }, { "epoch": 0.73, "learning_rate": 9.016111381950529e-07, "loss": 1.1582, "step": 24205 }, { "epoch": 0.73, "learning_rate": 9.014235929377269e-07, "loss": 1.1025, "step": 24206 }, { "epoch": 0.73, "learning_rate": 9.012360628980779e-07, "loss": 1.0557, "step": 24207 }, { "epoch": 0.73, "learning_rate": 9.010485480778918e-07, "loss": 1.0858, "step": 24208 }, { "epoch": 0.73, "learning_rate": 9.008610484789543e-07, "loss": 1.065, "step": 24209 }, { "epoch": 0.73, "learning_rate": 9.006735641030487e-07, "loss": 1.1786, "step": 24210 }, { "epoch": 0.73, "learning_rate": 9.004860949519603e-07, "loss": 1.1051, "step": 24211 }, { "epoch": 0.73, "learning_rate": 9.002986410274742e-07, "loss": 1.1718, "step": 24212 }, { "epoch": 0.73, "learning_rate": 9.001112023313744e-07, "loss": 1.0873, "step": 24213 }, { "epoch": 0.73, "learning_rate": 8.999237788654463e-07, "loss": 1.1251, "step": 24214 }, { "epoch": 0.73, "learning_rate": 8.997363706314724e-07, "loss": 1.0484, "step": 24215 }, { "epoch": 0.73, "learning_rate": 8.995489776312375e-07, "loss": 1.1236, "step": 24216 }, { "epoch": 0.73, "learning_rate": 8.993615998665256e-07, "loss": 1.1005, "step": 24217 }, { "epoch": 0.73, "learning_rate": 8.99174237339121e-07, "loss": 1.1886, "step": 24218 }, { "epoch": 0.73, "learning_rate": 8.989868900508062e-07, "loss": 1.201, "step": 24219 }, { "epoch": 0.73, "learning_rate": 8.987995580033648e-07, "loss": 1.0217, "step": 24220 }, { "epoch": 0.73, "learning_rate": 8.986122411985804e-07, "loss": 1.0572, "step": 24221 }, { "epoch": 0.73, "learning_rate": 8.984249396382372e-07, "loss": 1.0716, "step": 24222 }, { "epoch": 0.73, "learning_rate": 8.982376533241166e-07, "loss": 1.0702, "step": 24223 }, { "epoch": 0.73, "learning_rate": 8.980503822580017e-07, "loss": 1.108, "step": 24224 }, { "epoch": 0.73, "learning_rate": 8.97863126441676e-07, "loss": 1.114, "step": 24225 }, { "epoch": 0.73, "learning_rate": 8.976758858769216e-07, "loss": 1.1284, "step": 24226 }, { "epoch": 0.73, "learning_rate": 8.974886605655208e-07, "loss": 1.1818, "step": 24227 }, { "epoch": 0.73, "learning_rate": 8.973014505092565e-07, "loss": 1.1068, "step": 24228 }, { "epoch": 0.73, "learning_rate": 8.971142557099113e-07, "loss": 1.0449, "step": 24229 }, { "epoch": 0.73, "learning_rate": 8.969270761692652e-07, "loss": 1.0851, "step": 24230 }, { "epoch": 0.73, "learning_rate": 8.967399118891019e-07, "loss": 1.11, "step": 24231 }, { "epoch": 0.73, "learning_rate": 8.965527628712021e-07, "loss": 1.1637, "step": 24232 }, { "epoch": 0.73, "learning_rate": 8.963656291173476e-07, "loss": 1.0936, "step": 24233 }, { "epoch": 0.73, "learning_rate": 8.961785106293202e-07, "loss": 0.9727, "step": 24234 }, { "epoch": 0.73, "learning_rate": 8.959914074089018e-07, "loss": 1.0091, "step": 24235 }, { "epoch": 0.73, "learning_rate": 8.958043194578717e-07, "loss": 1.2193, "step": 24236 }, { "epoch": 0.73, "learning_rate": 8.95617246778012e-07, "loss": 1.1716, "step": 24237 }, { "epoch": 0.73, "learning_rate": 8.954301893711034e-07, "loss": 1.0492, "step": 24238 }, { "epoch": 0.73, "learning_rate": 8.952431472389267e-07, "loss": 1.1596, "step": 24239 }, { "epoch": 0.73, "learning_rate": 8.95056120383263e-07, "loss": 1.0631, "step": 24240 }, { "epoch": 0.73, "learning_rate": 8.948691088058914e-07, "loss": 1.0579, "step": 24241 }, { "epoch": 0.73, "learning_rate": 8.946821125085928e-07, "loss": 1.1064, "step": 24242 }, { "epoch": 0.73, "learning_rate": 8.944951314931471e-07, "loss": 1.1792, "step": 24243 }, { "epoch": 0.73, "learning_rate": 8.943081657613356e-07, "loss": 1.1606, "step": 24244 }, { "epoch": 0.73, "learning_rate": 8.941212153149362e-07, "loss": 1.1124, "step": 24245 }, { "epoch": 0.73, "learning_rate": 8.939342801557293e-07, "loss": 1.0919, "step": 24246 }, { "epoch": 0.73, "learning_rate": 8.937473602854945e-07, "loss": 1.0607, "step": 24247 }, { "epoch": 0.73, "learning_rate": 8.935604557060124e-07, "loss": 1.0491, "step": 24248 }, { "epoch": 0.73, "learning_rate": 8.933735664190598e-07, "loss": 1.147, "step": 24249 }, { "epoch": 0.73, "learning_rate": 8.931866924264173e-07, "loss": 1.065, "step": 24250 }, { "epoch": 0.73, "learning_rate": 8.929998337298637e-07, "loss": 1.0923, "step": 24251 }, { "epoch": 0.73, "learning_rate": 8.928129903311774e-07, "loss": 1.1547, "step": 24252 }, { "epoch": 0.73, "learning_rate": 8.926261622321386e-07, "loss": 1.101, "step": 24253 }, { "epoch": 0.73, "learning_rate": 8.924393494345235e-07, "loss": 1.1398, "step": 24254 }, { "epoch": 0.73, "learning_rate": 8.922525519401118e-07, "loss": 1.0781, "step": 24255 }, { "epoch": 0.73, "learning_rate": 8.920657697506813e-07, "loss": 1.1476, "step": 24256 }, { "epoch": 0.73, "learning_rate": 8.918790028680102e-07, "loss": 1.1379, "step": 24257 }, { "epoch": 0.73, "learning_rate": 8.916922512938766e-07, "loss": 1.0685, "step": 24258 }, { "epoch": 0.73, "learning_rate": 8.915055150300583e-07, "loss": 0.9938, "step": 24259 }, { "epoch": 0.73, "learning_rate": 8.913187940783327e-07, "loss": 1.0715, "step": 24260 }, { "epoch": 0.73, "learning_rate": 8.911320884404781e-07, "loss": 1.2554, "step": 24261 }, { "epoch": 0.73, "learning_rate": 8.909453981182705e-07, "loss": 1.2302, "step": 24262 }, { "epoch": 0.73, "learning_rate": 8.907587231134879e-07, "loss": 1.1116, "step": 24263 }, { "epoch": 0.73, "learning_rate": 8.905720634279069e-07, "loss": 1.2148, "step": 24264 }, { "epoch": 0.73, "learning_rate": 8.903854190633049e-07, "loss": 1.0059, "step": 24265 }, { "epoch": 0.73, "learning_rate": 8.901987900214595e-07, "loss": 1.1149, "step": 24266 }, { "epoch": 0.73, "learning_rate": 8.900121763041453e-07, "loss": 1.0782, "step": 24267 }, { "epoch": 0.73, "learning_rate": 8.898255779131398e-07, "loss": 1.1371, "step": 24268 }, { "epoch": 0.73, "learning_rate": 8.896389948502193e-07, "loss": 1.0112, "step": 24269 }, { "epoch": 0.73, "learning_rate": 8.894524271171607e-07, "loss": 1.0659, "step": 24270 }, { "epoch": 0.73, "learning_rate": 8.892658747157387e-07, "loss": 1.0526, "step": 24271 }, { "epoch": 0.73, "learning_rate": 8.890793376477297e-07, "loss": 1.0671, "step": 24272 }, { "epoch": 0.73, "learning_rate": 8.888928159149096e-07, "loss": 1.1208, "step": 24273 }, { "epoch": 0.73, "learning_rate": 8.887063095190549e-07, "loss": 1.1466, "step": 24274 }, { "epoch": 0.73, "learning_rate": 8.88519818461939e-07, "loss": 1.2357, "step": 24275 }, { "epoch": 0.73, "learning_rate": 8.883333427453387e-07, "loss": 1.1279, "step": 24276 }, { "epoch": 0.73, "learning_rate": 8.881468823710282e-07, "loss": 1.1008, "step": 24277 }, { "epoch": 0.73, "learning_rate": 8.879604373407844e-07, "loss": 1.0886, "step": 24278 }, { "epoch": 0.73, "learning_rate": 8.877740076563799e-07, "loss": 1.0764, "step": 24279 }, { "epoch": 0.73, "learning_rate": 8.875875933195905e-07, "loss": 1.1132, "step": 24280 }, { "epoch": 0.73, "learning_rate": 8.874011943321903e-07, "loss": 1.2052, "step": 24281 }, { "epoch": 0.73, "learning_rate": 8.872148106959543e-07, "loss": 1.1575, "step": 24282 }, { "epoch": 0.73, "learning_rate": 8.870284424126565e-07, "loss": 1.2061, "step": 24283 }, { "epoch": 0.73, "learning_rate": 8.868420894840712e-07, "loss": 0.9135, "step": 24284 }, { "epoch": 0.73, "learning_rate": 8.86655751911972e-07, "loss": 1.2341, "step": 24285 }, { "epoch": 0.73, "learning_rate": 8.864694296981333e-07, "loss": 1.1547, "step": 24286 }, { "epoch": 0.73, "learning_rate": 8.862831228443294e-07, "loss": 1.1824, "step": 24287 }, { "epoch": 0.73, "learning_rate": 8.860968313523318e-07, "loss": 1.0437, "step": 24288 }, { "epoch": 0.73, "learning_rate": 8.859105552239155e-07, "loss": 1.1811, "step": 24289 }, { "epoch": 0.73, "learning_rate": 8.857242944608532e-07, "loss": 1.0682, "step": 24290 }, { "epoch": 0.73, "learning_rate": 8.85538049064919e-07, "loss": 1.0651, "step": 24291 }, { "epoch": 0.73, "learning_rate": 8.85351819037884e-07, "loss": 1.1109, "step": 24292 }, { "epoch": 0.73, "learning_rate": 8.851656043815223e-07, "loss": 1.1341, "step": 24293 }, { "epoch": 0.73, "learning_rate": 8.849794050976063e-07, "loss": 1.0027, "step": 24294 }, { "epoch": 0.73, "learning_rate": 8.847932211879082e-07, "loss": 1.0763, "step": 24295 }, { "epoch": 0.73, "learning_rate": 8.846070526542019e-07, "loss": 1.2005, "step": 24296 }, { "epoch": 0.73, "learning_rate": 8.844208994982576e-07, "loss": 1.0746, "step": 24297 }, { "epoch": 0.73, "learning_rate": 8.84234761721848e-07, "loss": 1.1322, "step": 24298 }, { "epoch": 0.73, "learning_rate": 8.840486393267456e-07, "loss": 1.162, "step": 24299 }, { "epoch": 0.73, "learning_rate": 8.838625323147227e-07, "loss": 1.0858, "step": 24300 }, { "epoch": 0.73, "learning_rate": 8.836764406875489e-07, "loss": 1.0543, "step": 24301 }, { "epoch": 0.73, "learning_rate": 8.834903644469975e-07, "loss": 1.157, "step": 24302 }, { "epoch": 0.73, "learning_rate": 8.833043035948389e-07, "loss": 1.0749, "step": 24303 }, { "epoch": 0.73, "learning_rate": 8.831182581328457e-07, "loss": 1.0531, "step": 24304 }, { "epoch": 0.73, "learning_rate": 8.829322280627869e-07, "loss": 1.1376, "step": 24305 }, { "epoch": 0.73, "learning_rate": 8.827462133864348e-07, "loss": 1.1149, "step": 24306 }, { "epoch": 0.73, "learning_rate": 8.825602141055598e-07, "loss": 1.0386, "step": 24307 }, { "epoch": 0.73, "learning_rate": 8.823742302219324e-07, "loss": 1.1756, "step": 24308 }, { "epoch": 0.73, "learning_rate": 8.821882617373234e-07, "loss": 1.0903, "step": 24309 }, { "epoch": 0.73, "learning_rate": 8.820023086535029e-07, "loss": 1.1122, "step": 24310 }, { "epoch": 0.73, "learning_rate": 8.81816370972241e-07, "loss": 1.0981, "step": 24311 }, { "epoch": 0.73, "learning_rate": 8.81630448695309e-07, "loss": 1.2214, "step": 24312 }, { "epoch": 0.73, "learning_rate": 8.814445418244749e-07, "loss": 1.1441, "step": 24313 }, { "epoch": 0.73, "learning_rate": 8.81258650361509e-07, "loss": 1.153, "step": 24314 }, { "epoch": 0.73, "learning_rate": 8.810727743081812e-07, "loss": 1.1992, "step": 24315 }, { "epoch": 0.73, "learning_rate": 8.808869136662609e-07, "loss": 1.0023, "step": 24316 }, { "epoch": 0.73, "learning_rate": 8.807010684375183e-07, "loss": 1.1584, "step": 24317 }, { "epoch": 0.73, "learning_rate": 8.80515238623721e-07, "loss": 1.1841, "step": 24318 }, { "epoch": 0.73, "learning_rate": 8.803294242266384e-07, "loss": 1.1458, "step": 24319 }, { "epoch": 0.73, "learning_rate": 8.801436252480397e-07, "loss": 1.0901, "step": 24320 }, { "epoch": 0.73, "learning_rate": 8.799578416896934e-07, "loss": 1.133, "step": 24321 }, { "epoch": 0.73, "learning_rate": 8.797720735533691e-07, "loss": 1.0174, "step": 24322 }, { "epoch": 0.73, "learning_rate": 8.795863208408337e-07, "loss": 1.182, "step": 24323 }, { "epoch": 0.73, "learning_rate": 8.794005835538558e-07, "loss": 1.2932, "step": 24324 }, { "epoch": 0.73, "learning_rate": 8.792148616942043e-07, "loss": 1.0171, "step": 24325 }, { "epoch": 0.73, "learning_rate": 8.790291552636471e-07, "loss": 1.0931, "step": 24326 }, { "epoch": 0.73, "learning_rate": 8.78843464263951e-07, "loss": 1.0846, "step": 24327 }, { "epoch": 0.73, "learning_rate": 8.786577886968842e-07, "loss": 0.9265, "step": 24328 }, { "epoch": 0.73, "learning_rate": 8.784721285642145e-07, "loss": 1.0624, "step": 24329 }, { "epoch": 0.73, "learning_rate": 8.782864838677099e-07, "loss": 1.0966, "step": 24330 }, { "epoch": 0.73, "learning_rate": 8.781008546091363e-07, "loss": 1.0193, "step": 24331 }, { "epoch": 0.73, "learning_rate": 8.779152407902613e-07, "loss": 0.9966, "step": 24332 }, { "epoch": 0.73, "learning_rate": 8.77729642412852e-07, "loss": 1.0969, "step": 24333 }, { "epoch": 0.73, "learning_rate": 8.775440594786752e-07, "loss": 1.0883, "step": 24334 }, { "epoch": 0.73, "learning_rate": 8.773584919894984e-07, "loss": 1.1412, "step": 24335 }, { "epoch": 0.73, "learning_rate": 8.771729399470866e-07, "loss": 1.1696, "step": 24336 }, { "epoch": 0.73, "learning_rate": 8.769874033532067e-07, "loss": 1.1617, "step": 24337 }, { "epoch": 0.73, "learning_rate": 8.768018822096249e-07, "loss": 1.1781, "step": 24338 }, { "epoch": 0.73, "learning_rate": 8.766163765181076e-07, "loss": 1.1476, "step": 24339 }, { "epoch": 0.73, "learning_rate": 8.764308862804205e-07, "loss": 0.9913, "step": 24340 }, { "epoch": 0.73, "learning_rate": 8.762454114983293e-07, "loss": 1.1365, "step": 24341 }, { "epoch": 0.73, "learning_rate": 8.760599521735999e-07, "loss": 1.0755, "step": 24342 }, { "epoch": 0.73, "learning_rate": 8.758745083079983e-07, "loss": 1.2251, "step": 24343 }, { "epoch": 0.73, "learning_rate": 8.756890799032886e-07, "loss": 1.0222, "step": 24344 }, { "epoch": 0.73, "learning_rate": 8.755036669612366e-07, "loss": 1.0692, "step": 24345 }, { "epoch": 0.73, "learning_rate": 8.753182694836071e-07, "loss": 1.0557, "step": 24346 }, { "epoch": 0.73, "learning_rate": 8.751328874721651e-07, "loss": 1.0607, "step": 24347 }, { "epoch": 0.73, "learning_rate": 8.749475209286764e-07, "loss": 1.135, "step": 24348 }, { "epoch": 0.73, "learning_rate": 8.747621698549039e-07, "loss": 1.2321, "step": 24349 }, { "epoch": 0.73, "learning_rate": 8.745768342526128e-07, "loss": 1.0753, "step": 24350 }, { "epoch": 0.73, "learning_rate": 8.743915141235674e-07, "loss": 1.1709, "step": 24351 }, { "epoch": 0.73, "learning_rate": 8.742062094695325e-07, "loss": 1.0991, "step": 24352 }, { "epoch": 0.73, "learning_rate": 8.740209202922708e-07, "loss": 1.1564, "step": 24353 }, { "epoch": 0.73, "learning_rate": 8.738356465935468e-07, "loss": 1.1193, "step": 24354 }, { "epoch": 0.73, "learning_rate": 8.736503883751243e-07, "loss": 1.2103, "step": 24355 }, { "epoch": 0.73, "learning_rate": 8.734651456387677e-07, "loss": 1.1924, "step": 24356 }, { "epoch": 0.73, "learning_rate": 8.732799183862386e-07, "loss": 1.0718, "step": 24357 }, { "epoch": 0.73, "learning_rate": 8.730947066193016e-07, "loss": 1.0328, "step": 24358 }, { "epoch": 0.73, "learning_rate": 8.729095103397189e-07, "loss": 1.0341, "step": 24359 }, { "epoch": 0.73, "learning_rate": 8.727243295492544e-07, "loss": 0.9731, "step": 24360 }, { "epoch": 0.73, "learning_rate": 8.725391642496711e-07, "loss": 1.1266, "step": 24361 }, { "epoch": 0.73, "learning_rate": 8.723540144427306e-07, "loss": 1.0634, "step": 24362 }, { "epoch": 0.73, "learning_rate": 8.721688801301958e-07, "loss": 1.1324, "step": 24363 }, { "epoch": 0.73, "learning_rate": 8.719837613138293e-07, "loss": 1.1564, "step": 24364 }, { "epoch": 0.73, "learning_rate": 8.717986579953936e-07, "loss": 1.1588, "step": 24365 }, { "epoch": 0.73, "learning_rate": 8.716135701766501e-07, "loss": 0.9973, "step": 24366 }, { "epoch": 0.73, "learning_rate": 8.714284978593613e-07, "loss": 1.0998, "step": 24367 }, { "epoch": 0.73, "learning_rate": 8.712434410452889e-07, "loss": 1.1325, "step": 24368 }, { "epoch": 0.73, "learning_rate": 8.710583997361952e-07, "loss": 1.0598, "step": 24369 }, { "epoch": 0.73, "learning_rate": 8.708733739338401e-07, "loss": 1.0885, "step": 24370 }, { "epoch": 0.73, "learning_rate": 8.706883636399862e-07, "loss": 1.0623, "step": 24371 }, { "epoch": 0.73, "learning_rate": 8.70503368856394e-07, "loss": 1.0737, "step": 24372 }, { "epoch": 0.73, "learning_rate": 8.703183895848253e-07, "loss": 1.1202, "step": 24373 }, { "epoch": 0.73, "learning_rate": 8.701334258270413e-07, "loss": 1.2922, "step": 24374 }, { "epoch": 0.73, "learning_rate": 8.699484775848013e-07, "loss": 1.0792, "step": 24375 }, { "epoch": 0.73, "learning_rate": 8.697635448598668e-07, "loss": 1.0095, "step": 24376 }, { "epoch": 0.73, "learning_rate": 8.69578627653998e-07, "loss": 1.0151, "step": 24377 }, { "epoch": 0.73, "learning_rate": 8.693937259689567e-07, "loss": 1.0399, "step": 24378 }, { "epoch": 0.73, "learning_rate": 8.692088398065005e-07, "loss": 1.1141, "step": 24379 }, { "epoch": 0.73, "learning_rate": 8.690239691683911e-07, "loss": 1.1841, "step": 24380 }, { "epoch": 0.73, "learning_rate": 8.688391140563876e-07, "loss": 1.3054, "step": 24381 }, { "epoch": 0.73, "learning_rate": 8.686542744722512e-07, "loss": 1.2437, "step": 24382 }, { "epoch": 0.73, "learning_rate": 8.684694504177396e-07, "loss": 1.1193, "step": 24383 }, { "epoch": 0.73, "learning_rate": 8.682846418946131e-07, "loss": 1.0865, "step": 24384 }, { "epoch": 0.73, "learning_rate": 8.680998489046307e-07, "loss": 1.0424, "step": 24385 }, { "epoch": 0.73, "learning_rate": 8.679150714495522e-07, "loss": 1.1407, "step": 24386 }, { "epoch": 0.73, "learning_rate": 8.677303095311368e-07, "loss": 1.1151, "step": 24387 }, { "epoch": 0.73, "learning_rate": 8.675455631511418e-07, "loss": 1.1799, "step": 24388 }, { "epoch": 0.73, "learning_rate": 8.673608323113269e-07, "loss": 1.0214, "step": 24389 }, { "epoch": 0.73, "learning_rate": 8.671761170134505e-07, "loss": 1.0259, "step": 24390 }, { "epoch": 0.73, "learning_rate": 8.669914172592711e-07, "loss": 0.9979, "step": 24391 }, { "epoch": 0.73, "learning_rate": 8.66806733050547e-07, "loss": 1.153, "step": 24392 }, { "epoch": 0.73, "learning_rate": 8.666220643890364e-07, "loss": 1.1663, "step": 24393 }, { "epoch": 0.73, "learning_rate": 8.664374112764975e-07, "loss": 0.974, "step": 24394 }, { "epoch": 0.73, "learning_rate": 8.662527737146873e-07, "loss": 1.0746, "step": 24395 }, { "epoch": 0.73, "learning_rate": 8.660681517053634e-07, "loss": 1.0209, "step": 24396 }, { "epoch": 0.73, "learning_rate": 8.658835452502839e-07, "loss": 1.0837, "step": 24397 }, { "epoch": 0.73, "learning_rate": 8.656989543512062e-07, "loss": 1.1033, "step": 24398 }, { "epoch": 0.74, "learning_rate": 8.655143790098874e-07, "loss": 1.0912, "step": 24399 }, { "epoch": 0.74, "learning_rate": 8.653298192280851e-07, "loss": 1.1575, "step": 24400 }, { "epoch": 0.74, "learning_rate": 8.651452750075551e-07, "loss": 1.0545, "step": 24401 }, { "epoch": 0.74, "learning_rate": 8.649607463500545e-07, "loss": 1.0294, "step": 24402 }, { "epoch": 0.74, "learning_rate": 8.647762332573401e-07, "loss": 1.0322, "step": 24403 }, { "epoch": 0.74, "learning_rate": 8.645917357311693e-07, "loss": 1.0141, "step": 24404 }, { "epoch": 0.74, "learning_rate": 8.644072537732967e-07, "loss": 1.0012, "step": 24405 }, { "epoch": 0.74, "learning_rate": 8.642227873854794e-07, "loss": 1.1896, "step": 24406 }, { "epoch": 0.74, "learning_rate": 8.640383365694732e-07, "loss": 1.048, "step": 24407 }, { "epoch": 0.74, "learning_rate": 8.63853901327035e-07, "loss": 1.1642, "step": 24408 }, { "epoch": 0.74, "learning_rate": 8.63669481659919e-07, "loss": 1.0863, "step": 24409 }, { "epoch": 0.74, "learning_rate": 8.634850775698814e-07, "loss": 1.1316, "step": 24410 }, { "epoch": 0.74, "learning_rate": 8.633006890586776e-07, "loss": 1.0914, "step": 24411 }, { "epoch": 0.74, "learning_rate": 8.631163161280629e-07, "loss": 1.2688, "step": 24412 }, { "epoch": 0.74, "learning_rate": 8.629319587797935e-07, "loss": 1.1049, "step": 24413 }, { "epoch": 0.74, "learning_rate": 8.627476170156224e-07, "loss": 1.1539, "step": 24414 }, { "epoch": 0.74, "learning_rate": 8.625632908373054e-07, "loss": 1.0576, "step": 24415 }, { "epoch": 0.74, "learning_rate": 8.623789802465976e-07, "loss": 1.0611, "step": 24416 }, { "epoch": 0.74, "learning_rate": 8.621946852452539e-07, "loss": 1.12, "step": 24417 }, { "epoch": 0.74, "learning_rate": 8.62010405835027e-07, "loss": 1.106, "step": 24418 }, { "epoch": 0.74, "learning_rate": 8.618261420176724e-07, "loss": 1.2224, "step": 24419 }, { "epoch": 0.74, "learning_rate": 8.616418937949439e-07, "loss": 1.2617, "step": 24420 }, { "epoch": 0.74, "learning_rate": 8.614576611685954e-07, "loss": 1.0782, "step": 24421 }, { "epoch": 0.74, "learning_rate": 8.612734441403808e-07, "loss": 1.1162, "step": 24422 }, { "epoch": 0.74, "learning_rate": 8.610892427120541e-07, "loss": 1.2156, "step": 24423 }, { "epoch": 0.74, "learning_rate": 8.60905056885368e-07, "loss": 1.0593, "step": 24424 }, { "epoch": 0.74, "learning_rate": 8.607208866620767e-07, "loss": 1.126, "step": 24425 }, { "epoch": 0.74, "learning_rate": 8.605367320439337e-07, "loss": 1.1011, "step": 24426 }, { "epoch": 0.74, "learning_rate": 8.603525930326906e-07, "loss": 1.0679, "step": 24427 }, { "epoch": 0.74, "learning_rate": 8.601684696301014e-07, "loss": 1.1722, "step": 24428 }, { "epoch": 0.74, "learning_rate": 8.599843618379183e-07, "loss": 1.1466, "step": 24429 }, { "epoch": 0.74, "learning_rate": 8.59800269657895e-07, "loss": 1.05, "step": 24430 }, { "epoch": 0.74, "learning_rate": 8.596161930917827e-07, "loss": 1.1367, "step": 24431 }, { "epoch": 0.74, "learning_rate": 8.594321321413338e-07, "loss": 1.0908, "step": 24432 }, { "epoch": 0.74, "learning_rate": 8.592480868083011e-07, "loss": 1.0514, "step": 24433 }, { "epoch": 0.74, "learning_rate": 8.590640570944372e-07, "loss": 0.9578, "step": 24434 }, { "epoch": 0.74, "learning_rate": 8.588800430014923e-07, "loss": 1.1508, "step": 24435 }, { "epoch": 0.74, "learning_rate": 8.586960445312192e-07, "loss": 1.0342, "step": 24436 }, { "epoch": 0.74, "learning_rate": 8.58512061685369e-07, "loss": 1.21, "step": 24437 }, { "epoch": 0.74, "learning_rate": 8.583280944656936e-07, "loss": 1.1109, "step": 24438 }, { "epoch": 0.74, "learning_rate": 8.581441428739448e-07, "loss": 1.0453, "step": 24439 }, { "epoch": 0.74, "learning_rate": 8.579602069118723e-07, "loss": 1.0578, "step": 24440 }, { "epoch": 0.74, "learning_rate": 8.577762865812278e-07, "loss": 1.1439, "step": 24441 }, { "epoch": 0.74, "learning_rate": 8.575923818837619e-07, "loss": 1.1499, "step": 24442 }, { "epoch": 0.74, "learning_rate": 8.574084928212264e-07, "loss": 1.2003, "step": 24443 }, { "epoch": 0.74, "learning_rate": 8.572246193953704e-07, "loss": 0.9476, "step": 24444 }, { "epoch": 0.74, "learning_rate": 8.570407616079446e-07, "loss": 1.1616, "step": 24445 }, { "epoch": 0.74, "learning_rate": 8.568569194606996e-07, "loss": 1.1163, "step": 24446 }, { "epoch": 0.74, "learning_rate": 8.566730929553852e-07, "loss": 1.12, "step": 24447 }, { "epoch": 0.74, "learning_rate": 8.564892820937515e-07, "loss": 1.0397, "step": 24448 }, { "epoch": 0.74, "learning_rate": 8.563054868775483e-07, "loss": 1.0833, "step": 24449 }, { "epoch": 0.74, "learning_rate": 8.561217073085254e-07, "loss": 1.0683, "step": 24450 }, { "epoch": 0.74, "learning_rate": 8.559379433884321e-07, "loss": 1.1353, "step": 24451 }, { "epoch": 0.74, "learning_rate": 8.557541951190185e-07, "loss": 1.156, "step": 24452 }, { "epoch": 0.74, "learning_rate": 8.555704625020322e-07, "loss": 1.1622, "step": 24453 }, { "epoch": 0.74, "learning_rate": 8.553867455392234e-07, "loss": 1.073, "step": 24454 }, { "epoch": 0.74, "learning_rate": 8.552030442323403e-07, "loss": 1.205, "step": 24455 }, { "epoch": 0.74, "learning_rate": 8.550193585831332e-07, "loss": 1.1964, "step": 24456 }, { "epoch": 0.74, "learning_rate": 8.548356885933487e-07, "loss": 1.1366, "step": 24457 }, { "epoch": 0.74, "learning_rate": 8.54652034264736e-07, "loss": 1.069, "step": 24458 }, { "epoch": 0.74, "learning_rate": 8.544683955990435e-07, "loss": 1.1227, "step": 24459 }, { "epoch": 0.74, "learning_rate": 8.542847725980202e-07, "loss": 1.1166, "step": 24460 }, { "epoch": 0.74, "learning_rate": 8.541011652634123e-07, "loss": 1.064, "step": 24461 }, { "epoch": 0.74, "learning_rate": 8.53917573596969e-07, "loss": 1.1753, "step": 24462 }, { "epoch": 0.74, "learning_rate": 8.537339976004371e-07, "loss": 1.0731, "step": 24463 }, { "epoch": 0.74, "learning_rate": 8.535504372755659e-07, "loss": 1.1513, "step": 24464 }, { "epoch": 0.74, "learning_rate": 8.533668926241007e-07, "loss": 1.1372, "step": 24465 }, { "epoch": 0.74, "learning_rate": 8.531833636477896e-07, "loss": 1.0289, "step": 24466 }, { "epoch": 0.74, "learning_rate": 8.529998503483797e-07, "loss": 1.1176, "step": 24467 }, { "epoch": 0.74, "learning_rate": 8.528163527276182e-07, "loss": 1.0685, "step": 24468 }, { "epoch": 0.74, "learning_rate": 8.526328707872522e-07, "loss": 1.1188, "step": 24469 }, { "epoch": 0.74, "learning_rate": 8.524494045290272e-07, "loss": 1.1873, "step": 24470 }, { "epoch": 0.74, "learning_rate": 8.522659539546904e-07, "loss": 1.0604, "step": 24471 }, { "epoch": 0.74, "learning_rate": 8.520825190659882e-07, "loss": 1.097, "step": 24472 }, { "epoch": 0.74, "learning_rate": 8.518990998646664e-07, "loss": 1.05, "step": 24473 }, { "epoch": 0.74, "learning_rate": 8.51715696352472e-07, "loss": 1.0392, "step": 24474 }, { "epoch": 0.74, "learning_rate": 8.5153230853115e-07, "loss": 1.187, "step": 24475 }, { "epoch": 0.74, "learning_rate": 8.513489364024471e-07, "loss": 1.071, "step": 24476 }, { "epoch": 0.74, "learning_rate": 8.511655799681079e-07, "loss": 0.9125, "step": 24477 }, { "epoch": 0.74, "learning_rate": 8.50982239229878e-07, "loss": 1.1425, "step": 24478 }, { "epoch": 0.74, "learning_rate": 8.507989141895031e-07, "loss": 1.062, "step": 24479 }, { "epoch": 0.74, "learning_rate": 8.506156048487282e-07, "loss": 1.05, "step": 24480 }, { "epoch": 0.74, "learning_rate": 8.504323112092985e-07, "loss": 1.0884, "step": 24481 }, { "epoch": 0.74, "learning_rate": 8.502490332729596e-07, "loss": 1.0538, "step": 24482 }, { "epoch": 0.74, "learning_rate": 8.500657710414542e-07, "loss": 1.085, "step": 24483 }, { "epoch": 0.74, "learning_rate": 8.498825245165285e-07, "loss": 1.0869, "step": 24484 }, { "epoch": 0.74, "learning_rate": 8.49699293699926e-07, "loss": 1.1177, "step": 24485 }, { "epoch": 0.74, "learning_rate": 8.495160785933923e-07, "loss": 1.1487, "step": 24486 }, { "epoch": 0.74, "learning_rate": 8.493328791986699e-07, "loss": 1.0037, "step": 24487 }, { "epoch": 0.74, "learning_rate": 8.491496955175036e-07, "loss": 1.0776, "step": 24488 }, { "epoch": 0.74, "learning_rate": 8.48966527551637e-07, "loss": 1.1245, "step": 24489 }, { "epoch": 0.74, "learning_rate": 8.487833753028149e-07, "loss": 1.0972, "step": 24490 }, { "epoch": 0.74, "learning_rate": 8.486002387727788e-07, "loss": 1.1923, "step": 24491 }, { "epoch": 0.74, "learning_rate": 8.48417117963273e-07, "loss": 1.0596, "step": 24492 }, { "epoch": 0.74, "learning_rate": 8.482340128760411e-07, "loss": 1.1407, "step": 24493 }, { "epoch": 0.74, "learning_rate": 8.480509235128257e-07, "loss": 1.0828, "step": 24494 }, { "epoch": 0.74, "learning_rate": 8.478678498753707e-07, "loss": 1.1464, "step": 24495 }, { "epoch": 0.74, "learning_rate": 8.476847919654174e-07, "loss": 1.1047, "step": 24496 }, { "epoch": 0.74, "learning_rate": 8.47501749784709e-07, "loss": 1.0839, "step": 24497 }, { "epoch": 0.74, "learning_rate": 8.47318723334988e-07, "loss": 1.1356, "step": 24498 }, { "epoch": 0.74, "learning_rate": 8.471357126179977e-07, "loss": 1.0555, "step": 24499 }, { "epoch": 0.74, "learning_rate": 8.469527176354786e-07, "loss": 1.0804, "step": 24500 }, { "epoch": 0.74, "learning_rate": 8.467697383891735e-07, "loss": 1.1783, "step": 24501 }, { "epoch": 0.74, "learning_rate": 8.46586774880824e-07, "loss": 1.1053, "step": 24502 }, { "epoch": 0.74, "learning_rate": 8.464038271121724e-07, "loss": 1.0364, "step": 24503 }, { "epoch": 0.74, "learning_rate": 8.462208950849599e-07, "loss": 1.0842, "step": 24504 }, { "epoch": 0.74, "learning_rate": 8.460379788009279e-07, "loss": 1.1114, "step": 24505 }, { "epoch": 0.74, "learning_rate": 8.458550782618177e-07, "loss": 0.92, "step": 24506 }, { "epoch": 0.74, "learning_rate": 8.456721934693706e-07, "loss": 1.0173, "step": 24507 }, { "epoch": 0.74, "learning_rate": 8.454893244253284e-07, "loss": 0.9927, "step": 24508 }, { "epoch": 0.74, "learning_rate": 8.453064711314299e-07, "loss": 1.0514, "step": 24509 }, { "epoch": 0.74, "learning_rate": 8.451236335894172e-07, "loss": 1.1713, "step": 24510 }, { "epoch": 0.74, "learning_rate": 8.449408118010302e-07, "loss": 1.1207, "step": 24511 }, { "epoch": 0.74, "learning_rate": 8.447580057680105e-07, "loss": 1.1198, "step": 24512 }, { "epoch": 0.74, "learning_rate": 8.445752154920966e-07, "loss": 1.0844, "step": 24513 }, { "epoch": 0.74, "learning_rate": 8.443924409750293e-07, "loss": 1.1227, "step": 24514 }, { "epoch": 0.74, "learning_rate": 8.442096822185486e-07, "loss": 1.1868, "step": 24515 }, { "epoch": 0.74, "learning_rate": 8.440269392243952e-07, "loss": 1.2178, "step": 24516 }, { "epoch": 0.74, "learning_rate": 8.438442119943069e-07, "loss": 1.0847, "step": 24517 }, { "epoch": 0.74, "learning_rate": 8.436615005300242e-07, "loss": 1.1379, "step": 24518 }, { "epoch": 0.74, "learning_rate": 8.434788048332862e-07, "loss": 1.1143, "step": 24519 }, { "epoch": 0.74, "learning_rate": 8.432961249058321e-07, "loss": 1.1418, "step": 24520 }, { "epoch": 0.74, "learning_rate": 8.431134607494019e-07, "loss": 1.0953, "step": 24521 }, { "epoch": 0.74, "learning_rate": 8.429308123657326e-07, "loss": 1.1379, "step": 24522 }, { "epoch": 0.74, "learning_rate": 8.42748179756564e-07, "loss": 1.0389, "step": 24523 }, { "epoch": 0.74, "learning_rate": 8.425655629236346e-07, "loss": 1.1331, "step": 24524 }, { "epoch": 0.74, "learning_rate": 8.423829618686835e-07, "loss": 1.1325, "step": 24525 }, { "epoch": 0.74, "learning_rate": 8.422003765934475e-07, "loss": 1.0735, "step": 24526 }, { "epoch": 0.74, "learning_rate": 8.420178070996657e-07, "loss": 1.0702, "step": 24527 }, { "epoch": 0.74, "learning_rate": 8.418352533890756e-07, "loss": 1.2233, "step": 24528 }, { "epoch": 0.74, "learning_rate": 8.416527154634155e-07, "loss": 1.1292, "step": 24529 }, { "epoch": 0.74, "learning_rate": 8.414701933244226e-07, "loss": 1.1304, "step": 24530 }, { "epoch": 0.74, "learning_rate": 8.412876869738348e-07, "loss": 1.152, "step": 24531 }, { "epoch": 0.74, "learning_rate": 8.411051964133895e-07, "loss": 1.208, "step": 24532 }, { "epoch": 0.74, "learning_rate": 8.409227216448234e-07, "loss": 1.0924, "step": 24533 }, { "epoch": 0.74, "learning_rate": 8.407402626698752e-07, "loss": 1.2433, "step": 24534 }, { "epoch": 0.74, "learning_rate": 8.405578194902797e-07, "loss": 1.184, "step": 24535 }, { "epoch": 0.74, "learning_rate": 8.403753921077743e-07, "loss": 1.0286, "step": 24536 }, { "epoch": 0.74, "learning_rate": 8.40192980524096e-07, "loss": 1.1091, "step": 24537 }, { "epoch": 0.74, "learning_rate": 8.400105847409821e-07, "loss": 1.1066, "step": 24538 }, { "epoch": 0.74, "learning_rate": 8.398282047601669e-07, "loss": 1.1624, "step": 24539 }, { "epoch": 0.74, "learning_rate": 8.396458405833876e-07, "loss": 1.0468, "step": 24540 }, { "epoch": 0.74, "learning_rate": 8.394634922123804e-07, "loss": 1.042, "step": 24541 }, { "epoch": 0.74, "learning_rate": 8.392811596488818e-07, "loss": 1.0807, "step": 24542 }, { "epoch": 0.74, "learning_rate": 8.390988428946259e-07, "loss": 1.2085, "step": 24543 }, { "epoch": 0.74, "learning_rate": 8.38916541951349e-07, "loss": 1.1112, "step": 24544 }, { "epoch": 0.74, "learning_rate": 8.387342568207868e-07, "loss": 1.0842, "step": 24545 }, { "epoch": 0.74, "learning_rate": 8.385519875046741e-07, "loss": 1.0848, "step": 24546 }, { "epoch": 0.74, "learning_rate": 8.383697340047475e-07, "loss": 1.1502, "step": 24547 }, { "epoch": 0.74, "learning_rate": 8.381874963227396e-07, "loss": 1.1472, "step": 24548 }, { "epoch": 0.74, "learning_rate": 8.380052744603867e-07, "loss": 1.046, "step": 24549 }, { "epoch": 0.74, "learning_rate": 8.378230684194227e-07, "loss": 1.0726, "step": 24550 }, { "epoch": 0.74, "learning_rate": 8.376408782015838e-07, "loss": 1.035, "step": 24551 }, { "epoch": 0.74, "learning_rate": 8.374587038086022e-07, "loss": 1.0292, "step": 24552 }, { "epoch": 0.74, "learning_rate": 8.372765452422129e-07, "loss": 1.115, "step": 24553 }, { "epoch": 0.74, "learning_rate": 8.370944025041502e-07, "loss": 1.0109, "step": 24554 }, { "epoch": 0.74, "learning_rate": 8.369122755961479e-07, "loss": 1.2051, "step": 24555 }, { "epoch": 0.74, "learning_rate": 8.367301645199396e-07, "loss": 1.2083, "step": 24556 }, { "epoch": 0.74, "learning_rate": 8.365480692772593e-07, "loss": 1.0701, "step": 24557 }, { "epoch": 0.74, "learning_rate": 8.363659898698401e-07, "loss": 1.0588, "step": 24558 }, { "epoch": 0.74, "learning_rate": 8.361839262994165e-07, "loss": 1.076, "step": 24559 }, { "epoch": 0.74, "learning_rate": 8.360018785677195e-07, "loss": 1.1391, "step": 24560 }, { "epoch": 0.74, "learning_rate": 8.358198466764833e-07, "loss": 1.2283, "step": 24561 }, { "epoch": 0.74, "learning_rate": 8.356378306274407e-07, "loss": 1.0784, "step": 24562 }, { "epoch": 0.74, "learning_rate": 8.354558304223242e-07, "loss": 1.0969, "step": 24563 }, { "epoch": 0.74, "learning_rate": 8.352738460628676e-07, "loss": 1.1245, "step": 24564 }, { "epoch": 0.74, "learning_rate": 8.350918775508013e-07, "loss": 1.2016, "step": 24565 }, { "epoch": 0.74, "learning_rate": 8.349099248878584e-07, "loss": 1.0722, "step": 24566 }, { "epoch": 0.74, "learning_rate": 8.347279880757711e-07, "loss": 1.1699, "step": 24567 }, { "epoch": 0.74, "learning_rate": 8.345460671162723e-07, "loss": 1.1823, "step": 24568 }, { "epoch": 0.74, "learning_rate": 8.343641620110918e-07, "loss": 1.138, "step": 24569 }, { "epoch": 0.74, "learning_rate": 8.341822727619625e-07, "loss": 1.1031, "step": 24570 }, { "epoch": 0.74, "learning_rate": 8.340003993706155e-07, "loss": 1.1052, "step": 24571 }, { "epoch": 0.74, "learning_rate": 8.338185418387823e-07, "loss": 1.0768, "step": 24572 }, { "epoch": 0.74, "learning_rate": 8.33636700168195e-07, "loss": 1.1513, "step": 24573 }, { "epoch": 0.74, "learning_rate": 8.33454874360583e-07, "loss": 1.0609, "step": 24574 }, { "epoch": 0.74, "learning_rate": 8.332730644176781e-07, "loss": 1.1351, "step": 24575 }, { "epoch": 0.74, "learning_rate": 8.330912703412106e-07, "loss": 0.9837, "step": 24576 }, { "epoch": 0.74, "learning_rate": 8.329094921329123e-07, "loss": 1.0413, "step": 24577 }, { "epoch": 0.74, "learning_rate": 8.327277297945121e-07, "loss": 1.14, "step": 24578 }, { "epoch": 0.74, "learning_rate": 8.325459833277408e-07, "loss": 1.0823, "step": 24579 }, { "epoch": 0.74, "learning_rate": 8.323642527343287e-07, "loss": 1.1734, "step": 24580 }, { "epoch": 0.74, "learning_rate": 8.321825380160064e-07, "loss": 1.1536, "step": 24581 }, { "epoch": 0.74, "learning_rate": 8.320008391745025e-07, "loss": 1.1799, "step": 24582 }, { "epoch": 0.74, "learning_rate": 8.318191562115472e-07, "loss": 1.1423, "step": 24583 }, { "epoch": 0.74, "learning_rate": 8.316374891288701e-07, "loss": 1.2207, "step": 24584 }, { "epoch": 0.74, "learning_rate": 8.314558379282006e-07, "loss": 1.2458, "step": 24585 }, { "epoch": 0.74, "learning_rate": 8.312742026112678e-07, "loss": 1.067, "step": 24586 }, { "epoch": 0.74, "learning_rate": 8.310925831798011e-07, "loss": 1.0605, "step": 24587 }, { "epoch": 0.74, "learning_rate": 8.309109796355291e-07, "loss": 1.2183, "step": 24588 }, { "epoch": 0.74, "learning_rate": 8.307293919801806e-07, "loss": 1.1536, "step": 24589 }, { "epoch": 0.74, "learning_rate": 8.305478202154855e-07, "loss": 1.0141, "step": 24590 }, { "epoch": 0.74, "learning_rate": 8.3036626434317e-07, "loss": 1.2156, "step": 24591 }, { "epoch": 0.74, "learning_rate": 8.301847243649638e-07, "loss": 1.1773, "step": 24592 }, { "epoch": 0.74, "learning_rate": 8.300032002825945e-07, "loss": 1.0278, "step": 24593 }, { "epoch": 0.74, "learning_rate": 8.298216920977914e-07, "loss": 1.096, "step": 24594 }, { "epoch": 0.74, "learning_rate": 8.296401998122808e-07, "loss": 1.0823, "step": 24595 }, { "epoch": 0.74, "learning_rate": 8.294587234277906e-07, "loss": 1.095, "step": 24596 }, { "epoch": 0.74, "learning_rate": 8.292772629460491e-07, "loss": 1.0659, "step": 24597 }, { "epoch": 0.74, "learning_rate": 8.290958183687833e-07, "loss": 1.1143, "step": 24598 }, { "epoch": 0.74, "learning_rate": 8.289143896977214e-07, "loss": 1.1305, "step": 24599 }, { "epoch": 0.74, "learning_rate": 8.287329769345889e-07, "loss": 1.1992, "step": 24600 }, { "epoch": 0.74, "learning_rate": 8.285515800811137e-07, "loss": 1.0962, "step": 24601 }, { "epoch": 0.74, "learning_rate": 8.283701991390222e-07, "loss": 1.0247, "step": 24602 }, { "epoch": 0.74, "learning_rate": 8.281888341100422e-07, "loss": 1.0595, "step": 24603 }, { "epoch": 0.74, "learning_rate": 8.280074849958986e-07, "loss": 1.1261, "step": 24604 }, { "epoch": 0.74, "learning_rate": 8.278261517983185e-07, "loss": 1.0035, "step": 24605 }, { "epoch": 0.74, "learning_rate": 8.27644834519028e-07, "loss": 1.1981, "step": 24606 }, { "epoch": 0.74, "learning_rate": 8.274635331597541e-07, "loss": 1.16, "step": 24607 }, { "epoch": 0.74, "learning_rate": 8.272822477222211e-07, "loss": 1.1304, "step": 24608 }, { "epoch": 0.74, "learning_rate": 8.271009782081554e-07, "loss": 1.078, "step": 24609 }, { "epoch": 0.74, "learning_rate": 8.269197246192826e-07, "loss": 1.197, "step": 24610 }, { "epoch": 0.74, "learning_rate": 8.267384869573283e-07, "loss": 1.176, "step": 24611 }, { "epoch": 0.74, "learning_rate": 8.265572652240178e-07, "loss": 1.0749, "step": 24612 }, { "epoch": 0.74, "learning_rate": 8.263760594210762e-07, "loss": 1.1382, "step": 24613 }, { "epoch": 0.74, "learning_rate": 8.261948695502284e-07, "loss": 1.0977, "step": 24614 }, { "epoch": 0.74, "learning_rate": 8.260136956131993e-07, "loss": 1.0374, "step": 24615 }, { "epoch": 0.74, "learning_rate": 8.258325376117144e-07, "loss": 1.1804, "step": 24616 }, { "epoch": 0.74, "learning_rate": 8.256513955474968e-07, "loss": 1.1771, "step": 24617 }, { "epoch": 0.74, "learning_rate": 8.254702694222714e-07, "loss": 1.1373, "step": 24618 }, { "epoch": 0.74, "learning_rate": 8.252891592377624e-07, "loss": 1.1304, "step": 24619 }, { "epoch": 0.74, "learning_rate": 8.251080649956949e-07, "loss": 1.0309, "step": 24620 }, { "epoch": 0.74, "learning_rate": 8.249269866977913e-07, "loss": 1.0724, "step": 24621 }, { "epoch": 0.74, "learning_rate": 8.247459243457759e-07, "loss": 1.0978, "step": 24622 }, { "epoch": 0.74, "learning_rate": 8.245648779413726e-07, "loss": 1.2299, "step": 24623 }, { "epoch": 0.74, "learning_rate": 8.243838474863048e-07, "loss": 1.1565, "step": 24624 }, { "epoch": 0.74, "learning_rate": 8.242028329822966e-07, "loss": 1.1628, "step": 24625 }, { "epoch": 0.74, "learning_rate": 8.240218344310693e-07, "loss": 1.1, "step": 24626 }, { "epoch": 0.74, "learning_rate": 8.238408518343468e-07, "loss": 1.0388, "step": 24627 }, { "epoch": 0.74, "learning_rate": 8.236598851938526e-07, "loss": 1.1549, "step": 24628 }, { "epoch": 0.74, "learning_rate": 8.234789345113095e-07, "loss": 1.0367, "step": 24629 }, { "epoch": 0.74, "learning_rate": 8.232979997884389e-07, "loss": 1.1798, "step": 24630 }, { "epoch": 0.74, "learning_rate": 8.231170810269634e-07, "loss": 1.0331, "step": 24631 }, { "epoch": 0.74, "learning_rate": 8.229361782286061e-07, "loss": 1.0019, "step": 24632 }, { "epoch": 0.74, "learning_rate": 8.227552913950892e-07, "loss": 1.071, "step": 24633 }, { "epoch": 0.74, "learning_rate": 8.225744205281333e-07, "loss": 1.2103, "step": 24634 }, { "epoch": 0.74, "learning_rate": 8.223935656294612e-07, "loss": 1.0537, "step": 24635 }, { "epoch": 0.74, "learning_rate": 8.222127267007946e-07, "loss": 1.0988, "step": 24636 }, { "epoch": 0.74, "learning_rate": 8.220319037438543e-07, "loss": 1.1214, "step": 24637 }, { "epoch": 0.74, "learning_rate": 8.218510967603624e-07, "loss": 1.1797, "step": 24638 }, { "epoch": 0.74, "learning_rate": 8.216703057520401e-07, "loss": 1.1467, "step": 24639 }, { "epoch": 0.74, "learning_rate": 8.214895307206078e-07, "loss": 1.1141, "step": 24640 }, { "epoch": 0.74, "learning_rate": 8.213087716677876e-07, "loss": 0.9458, "step": 24641 }, { "epoch": 0.74, "learning_rate": 8.211280285952989e-07, "loss": 1.0098, "step": 24642 }, { "epoch": 0.74, "learning_rate": 8.209473015048625e-07, "loss": 1.0865, "step": 24643 }, { "epoch": 0.74, "learning_rate": 8.20766590398199e-07, "loss": 1.0913, "step": 24644 }, { "epoch": 0.74, "learning_rate": 8.20585895277029e-07, "loss": 1.1538, "step": 24645 }, { "epoch": 0.74, "learning_rate": 8.204052161430734e-07, "loss": 1.2142, "step": 24646 }, { "epoch": 0.74, "learning_rate": 8.202245529980505e-07, "loss": 1.16, "step": 24647 }, { "epoch": 0.74, "learning_rate": 8.200439058436804e-07, "loss": 1.2032, "step": 24648 }, { "epoch": 0.74, "learning_rate": 8.198632746816834e-07, "loss": 1.058, "step": 24649 }, { "epoch": 0.74, "learning_rate": 8.1968265951378e-07, "loss": 1.1767, "step": 24650 }, { "epoch": 0.74, "learning_rate": 8.19502060341687e-07, "loss": 1.0941, "step": 24651 }, { "epoch": 0.74, "learning_rate": 8.193214771671254e-07, "loss": 1.075, "step": 24652 }, { "epoch": 0.74, "learning_rate": 8.191409099918138e-07, "loss": 1.1549, "step": 24653 }, { "epoch": 0.74, "learning_rate": 8.189603588174713e-07, "loss": 1.1409, "step": 24654 }, { "epoch": 0.74, "learning_rate": 8.187798236458175e-07, "loss": 1.054, "step": 24655 }, { "epoch": 0.74, "learning_rate": 8.18599304478569e-07, "loss": 0.9495, "step": 24656 }, { "epoch": 0.74, "learning_rate": 8.184188013174455e-07, "loss": 1.1254, "step": 24657 }, { "epoch": 0.74, "learning_rate": 8.182383141641651e-07, "loss": 1.1172, "step": 24658 }, { "epoch": 0.74, "learning_rate": 8.180578430204467e-07, "loss": 1.1291, "step": 24659 }, { "epoch": 0.74, "learning_rate": 8.178773878880066e-07, "loss": 1.2214, "step": 24660 }, { "epoch": 0.74, "learning_rate": 8.17696948768564e-07, "loss": 1.1189, "step": 24661 }, { "epoch": 0.74, "learning_rate": 8.175165256638359e-07, "loss": 1.1634, "step": 24662 }, { "epoch": 0.74, "learning_rate": 8.173361185755412e-07, "loss": 1.0888, "step": 24663 }, { "epoch": 0.74, "learning_rate": 8.171557275053954e-07, "loss": 1.0172, "step": 24664 }, { "epoch": 0.74, "learning_rate": 8.169753524551167e-07, "loss": 1.1289, "step": 24665 }, { "epoch": 0.74, "learning_rate": 8.167949934264219e-07, "loss": 1.0341, "step": 24666 }, { "epoch": 0.74, "learning_rate": 8.166146504210281e-07, "loss": 1.1273, "step": 24667 }, { "epoch": 0.74, "learning_rate": 8.164343234406522e-07, "loss": 1.0041, "step": 24668 }, { "epoch": 0.74, "learning_rate": 8.162540124870108e-07, "loss": 1.1046, "step": 24669 }, { "epoch": 0.74, "learning_rate": 8.1607371756182e-07, "loss": 1.1652, "step": 24670 }, { "epoch": 0.74, "learning_rate": 8.158934386667966e-07, "loss": 1.0433, "step": 24671 }, { "epoch": 0.74, "learning_rate": 8.157131758036572e-07, "loss": 1.1329, "step": 24672 }, { "epoch": 0.74, "learning_rate": 8.155329289741166e-07, "loss": 1.1068, "step": 24673 }, { "epoch": 0.74, "learning_rate": 8.15352698179891e-07, "loss": 1.0967, "step": 24674 }, { "epoch": 0.74, "learning_rate": 8.151724834226965e-07, "loss": 1.1478, "step": 24675 }, { "epoch": 0.74, "learning_rate": 8.149922847042493e-07, "loss": 1.0644, "step": 24676 }, { "epoch": 0.74, "learning_rate": 8.148121020262634e-07, "loss": 1.0728, "step": 24677 }, { "epoch": 0.74, "learning_rate": 8.146319353904545e-07, "loss": 1.0644, "step": 24678 }, { "epoch": 0.74, "learning_rate": 8.144517847985378e-07, "loss": 1.1104, "step": 24679 }, { "epoch": 0.74, "learning_rate": 8.142716502522283e-07, "loss": 1.2894, "step": 24680 }, { "epoch": 0.74, "learning_rate": 8.140915317532419e-07, "loss": 1.162, "step": 24681 }, { "epoch": 0.74, "learning_rate": 8.13911429303291e-07, "loss": 1.1441, "step": 24682 }, { "epoch": 0.74, "learning_rate": 8.137313429040916e-07, "loss": 1.2173, "step": 24683 }, { "epoch": 0.74, "learning_rate": 8.135512725573574e-07, "loss": 1.1066, "step": 24684 }, { "epoch": 0.74, "learning_rate": 8.133712182648038e-07, "loss": 1.174, "step": 24685 }, { "epoch": 0.74, "learning_rate": 8.131911800281431e-07, "loss": 1.201, "step": 24686 }, { "epoch": 0.74, "learning_rate": 8.130111578490899e-07, "loss": 1.0496, "step": 24687 }, { "epoch": 0.74, "learning_rate": 8.12831151729358e-07, "loss": 1.2411, "step": 24688 }, { "epoch": 0.74, "learning_rate": 8.126511616706617e-07, "loss": 1.1139, "step": 24689 }, { "epoch": 0.74, "learning_rate": 8.124711876747129e-07, "loss": 1.0851, "step": 24690 }, { "epoch": 0.74, "learning_rate": 8.122912297432259e-07, "loss": 1.1113, "step": 24691 }, { "epoch": 0.74, "learning_rate": 8.121112878779133e-07, "loss": 1.147, "step": 24692 }, { "epoch": 0.74, "learning_rate": 8.119313620804886e-07, "loss": 1.229, "step": 24693 }, { "epoch": 0.74, "learning_rate": 8.11751452352664e-07, "loss": 1.1057, "step": 24694 }, { "epoch": 0.74, "learning_rate": 8.115715586961526e-07, "loss": 1.068, "step": 24695 }, { "epoch": 0.74, "learning_rate": 8.113916811126668e-07, "loss": 1.0366, "step": 24696 }, { "epoch": 0.74, "learning_rate": 8.11211819603919e-07, "loss": 1.0895, "step": 24697 }, { "epoch": 0.74, "learning_rate": 8.110319741716222e-07, "loss": 1.0544, "step": 24698 }, { "epoch": 0.74, "learning_rate": 8.108521448174866e-07, "loss": 1.2122, "step": 24699 }, { "epoch": 0.74, "learning_rate": 8.106723315432252e-07, "loss": 1.105, "step": 24700 }, { "epoch": 0.74, "learning_rate": 8.104925343505493e-07, "loss": 1.0658, "step": 24701 }, { "epoch": 0.74, "learning_rate": 8.10312753241172e-07, "loss": 1.1724, "step": 24702 }, { "epoch": 0.74, "learning_rate": 8.101329882168024e-07, "loss": 1.0802, "step": 24703 }, { "epoch": 0.74, "learning_rate": 8.099532392791529e-07, "loss": 1.0234, "step": 24704 }, { "epoch": 0.74, "learning_rate": 8.097735064299348e-07, "loss": 1.1655, "step": 24705 }, { "epoch": 0.74, "learning_rate": 8.095937896708588e-07, "loss": 1.2166, "step": 24706 }, { "epoch": 0.74, "learning_rate": 8.094140890036364e-07, "loss": 1.0361, "step": 24707 }, { "epoch": 0.74, "learning_rate": 8.092344044299771e-07, "loss": 1.0545, "step": 24708 }, { "epoch": 0.74, "learning_rate": 8.090547359515919e-07, "loss": 1.0544, "step": 24709 }, { "epoch": 0.74, "learning_rate": 8.088750835701912e-07, "loss": 1.1125, "step": 24710 }, { "epoch": 0.74, "learning_rate": 8.086954472874861e-07, "loss": 1.0974, "step": 24711 }, { "epoch": 0.74, "learning_rate": 8.085158271051849e-07, "loss": 1.0858, "step": 24712 }, { "epoch": 0.74, "learning_rate": 8.083362230249983e-07, "loss": 1.1219, "step": 24713 }, { "epoch": 0.74, "learning_rate": 8.081566350486364e-07, "loss": 1.095, "step": 24714 }, { "epoch": 0.74, "learning_rate": 8.079770631778092e-07, "loss": 1.0604, "step": 24715 }, { "epoch": 0.74, "learning_rate": 8.077975074142244e-07, "loss": 1.1328, "step": 24716 }, { "epoch": 0.74, "learning_rate": 8.076179677595927e-07, "loss": 1.1045, "step": 24717 }, { "epoch": 0.74, "learning_rate": 8.074384442156227e-07, "loss": 1.2075, "step": 24718 }, { "epoch": 0.74, "learning_rate": 8.072589367840236e-07, "loss": 1.1296, "step": 24719 }, { "epoch": 0.74, "learning_rate": 8.07079445466504e-07, "loss": 1.1022, "step": 24720 }, { "epoch": 0.74, "learning_rate": 8.068999702647728e-07, "loss": 1.0016, "step": 24721 }, { "epoch": 0.74, "learning_rate": 8.067205111805384e-07, "loss": 1.2323, "step": 24722 }, { "epoch": 0.74, "learning_rate": 8.065410682155103e-07, "loss": 1.1415, "step": 24723 }, { "epoch": 0.74, "learning_rate": 8.063616413713945e-07, "loss": 1.0684, "step": 24724 }, { "epoch": 0.74, "learning_rate": 8.061822306499007e-07, "loss": 1.2753, "step": 24725 }, { "epoch": 0.74, "learning_rate": 8.060028360527359e-07, "loss": 1.1539, "step": 24726 }, { "epoch": 0.74, "learning_rate": 8.058234575816082e-07, "loss": 1.1266, "step": 24727 }, { "epoch": 0.74, "learning_rate": 8.05644095238226e-07, "loss": 1.0786, "step": 24728 }, { "epoch": 0.74, "learning_rate": 8.054647490242953e-07, "loss": 1.048, "step": 24729 }, { "epoch": 0.74, "learning_rate": 8.052854189415243e-07, "loss": 1.0671, "step": 24730 }, { "epoch": 0.75, "learning_rate": 8.051061049916198e-07, "loss": 1.1596, "step": 24731 }, { "epoch": 0.75, "learning_rate": 8.049268071762886e-07, "loss": 1.1091, "step": 24732 }, { "epoch": 0.75, "learning_rate": 8.04747525497239e-07, "loss": 1.136, "step": 24733 }, { "epoch": 0.75, "learning_rate": 8.045682599561755e-07, "loss": 1.0074, "step": 24734 }, { "epoch": 0.75, "learning_rate": 8.043890105548055e-07, "loss": 1.136, "step": 24735 }, { "epoch": 0.75, "learning_rate": 8.042097772948357e-07, "loss": 1.0746, "step": 24736 }, { "epoch": 0.75, "learning_rate": 8.040305601779727e-07, "loss": 1.1553, "step": 24737 }, { "epoch": 0.75, "learning_rate": 8.038513592059213e-07, "loss": 1.1393, "step": 24738 }, { "epoch": 0.75, "learning_rate": 8.03672174380388e-07, "loss": 1.0756, "step": 24739 }, { "epoch": 0.75, "learning_rate": 8.034930057030788e-07, "loss": 1.1235, "step": 24740 }, { "epoch": 0.75, "learning_rate": 8.033138531756998e-07, "loss": 0.9929, "step": 24741 }, { "epoch": 0.75, "learning_rate": 8.031347167999548e-07, "loss": 1.2403, "step": 24742 }, { "epoch": 0.75, "learning_rate": 8.029555965775504e-07, "loss": 1.0282, "step": 24743 }, { "epoch": 0.75, "learning_rate": 8.02776492510191e-07, "loss": 1.1538, "step": 24744 }, { "epoch": 0.75, "learning_rate": 8.025974045995822e-07, "loss": 1.0918, "step": 24745 }, { "epoch": 0.75, "learning_rate": 8.024183328474294e-07, "loss": 1.0217, "step": 24746 }, { "epoch": 0.75, "learning_rate": 8.022392772554358e-07, "loss": 1.1326, "step": 24747 }, { "epoch": 0.75, "learning_rate": 8.020602378253064e-07, "loss": 1.1895, "step": 24748 }, { "epoch": 0.75, "learning_rate": 8.01881214558746e-07, "loss": 1.0988, "step": 24749 }, { "epoch": 0.75, "learning_rate": 8.017022074574585e-07, "loss": 0.9666, "step": 24750 }, { "epoch": 0.75, "learning_rate": 8.015232165231479e-07, "loss": 1.1589, "step": 24751 }, { "epoch": 0.75, "learning_rate": 8.013442417575184e-07, "loss": 1.0751, "step": 24752 }, { "epoch": 0.75, "learning_rate": 8.011652831622735e-07, "loss": 1.0298, "step": 24753 }, { "epoch": 0.75, "learning_rate": 8.00986340739118e-07, "loss": 1.1941, "step": 24754 }, { "epoch": 0.75, "learning_rate": 8.008074144897532e-07, "loss": 1.2192, "step": 24755 }, { "epoch": 0.75, "learning_rate": 8.006285044158835e-07, "loss": 1.2432, "step": 24756 }, { "epoch": 0.75, "learning_rate": 8.00449610519212e-07, "loss": 1.1302, "step": 24757 }, { "epoch": 0.75, "learning_rate": 8.002707328014417e-07, "loss": 1.0853, "step": 24758 }, { "epoch": 0.75, "learning_rate": 8.000918712642763e-07, "loss": 1.1115, "step": 24759 }, { "epoch": 0.75, "learning_rate": 7.999130259094168e-07, "loss": 1.1368, "step": 24760 }, { "epoch": 0.75, "learning_rate": 7.997341967385664e-07, "loss": 1.2343, "step": 24761 }, { "epoch": 0.75, "learning_rate": 7.995553837534275e-07, "loss": 1.2468, "step": 24762 }, { "epoch": 0.75, "learning_rate": 7.993765869557033e-07, "loss": 1.0437, "step": 24763 }, { "epoch": 0.75, "learning_rate": 7.99197806347094e-07, "loss": 1.1016, "step": 24764 }, { "epoch": 0.75, "learning_rate": 7.990190419293025e-07, "loss": 1.0708, "step": 24765 }, { "epoch": 0.75, "learning_rate": 7.988402937040307e-07, "loss": 1.1339, "step": 24766 }, { "epoch": 0.75, "learning_rate": 7.986615616729807e-07, "loss": 1.1161, "step": 24767 }, { "epoch": 0.75, "learning_rate": 7.984828458378522e-07, "loss": 1.083, "step": 24768 }, { "epoch": 0.75, "learning_rate": 7.983041462003477e-07, "loss": 1.1143, "step": 24769 }, { "epoch": 0.75, "learning_rate": 7.981254627621682e-07, "loss": 1.0918, "step": 24770 }, { "epoch": 0.75, "learning_rate": 7.979467955250148e-07, "loss": 1.1533, "step": 24771 }, { "epoch": 0.75, "learning_rate": 7.977681444905885e-07, "loss": 1.1568, "step": 24772 }, { "epoch": 0.75, "learning_rate": 7.975895096605893e-07, "loss": 1.075, "step": 24773 }, { "epoch": 0.75, "learning_rate": 7.974108910367179e-07, "loss": 1.0854, "step": 24774 }, { "epoch": 0.75, "learning_rate": 7.972322886206748e-07, "loss": 1.0411, "step": 24775 }, { "epoch": 0.75, "learning_rate": 7.970537024141603e-07, "loss": 1.0669, "step": 24776 }, { "epoch": 0.75, "learning_rate": 7.968751324188743e-07, "loss": 1.0648, "step": 24777 }, { "epoch": 0.75, "learning_rate": 7.966965786365169e-07, "loss": 1.0878, "step": 24778 }, { "epoch": 0.75, "learning_rate": 7.965180410687876e-07, "loss": 1.0808, "step": 24779 }, { "epoch": 0.75, "learning_rate": 7.96339519717387e-07, "loss": 1.0986, "step": 24780 }, { "epoch": 0.75, "learning_rate": 7.961610145840126e-07, "loss": 1.1115, "step": 24781 }, { "epoch": 0.75, "learning_rate": 7.959825256703652e-07, "loss": 1.0697, "step": 24782 }, { "epoch": 0.75, "learning_rate": 7.958040529781433e-07, "loss": 1.0372, "step": 24783 }, { "epoch": 0.75, "learning_rate": 7.956255965090459e-07, "loss": 1.0574, "step": 24784 }, { "epoch": 0.75, "learning_rate": 7.954471562647729e-07, "loss": 1.1423, "step": 24785 }, { "epoch": 0.75, "learning_rate": 7.952687322470212e-07, "loss": 1.1792, "step": 24786 }, { "epoch": 0.75, "learning_rate": 7.950903244574901e-07, "loss": 1.0634, "step": 24787 }, { "epoch": 0.75, "learning_rate": 7.94911932897878e-07, "loss": 1.2295, "step": 24788 }, { "epoch": 0.75, "learning_rate": 7.947335575698839e-07, "loss": 1.0454, "step": 24789 }, { "epoch": 0.75, "learning_rate": 7.945551984752042e-07, "loss": 1.1255, "step": 24790 }, { "epoch": 0.75, "learning_rate": 7.943768556155379e-07, "loss": 1.0123, "step": 24791 }, { "epoch": 0.75, "learning_rate": 7.941985289925821e-07, "loss": 1.1466, "step": 24792 }, { "epoch": 0.75, "learning_rate": 7.940202186080359e-07, "loss": 1.152, "step": 24793 }, { "epoch": 0.75, "learning_rate": 7.938419244635947e-07, "loss": 1.0667, "step": 24794 }, { "epoch": 0.75, "learning_rate": 7.936636465609565e-07, "loss": 1.1233, "step": 24795 }, { "epoch": 0.75, "learning_rate": 7.934853849018188e-07, "loss": 1.1295, "step": 24796 }, { "epoch": 0.75, "learning_rate": 7.933071394878783e-07, "loss": 0.9851, "step": 24797 }, { "epoch": 0.75, "learning_rate": 7.931289103208326e-07, "loss": 1.1967, "step": 24798 }, { "epoch": 0.75, "learning_rate": 7.929506974023768e-07, "loss": 1.1644, "step": 24799 }, { "epoch": 0.75, "learning_rate": 7.927725007342082e-07, "loss": 1.1538, "step": 24800 }, { "epoch": 0.75, "learning_rate": 7.925943203180234e-07, "loss": 1.2374, "step": 24801 }, { "epoch": 0.75, "learning_rate": 7.92416156155518e-07, "loss": 1.0988, "step": 24802 }, { "epoch": 0.75, "learning_rate": 7.922380082483885e-07, "loss": 1.0359, "step": 24803 }, { "epoch": 0.75, "learning_rate": 7.920598765983309e-07, "loss": 1.026, "step": 24804 }, { "epoch": 0.75, "learning_rate": 7.918817612070406e-07, "loss": 1.0751, "step": 24805 }, { "epoch": 0.75, "learning_rate": 7.917036620762139e-07, "loss": 1.0949, "step": 24806 }, { "epoch": 0.75, "learning_rate": 7.915255792075449e-07, "loss": 1.0595, "step": 24807 }, { "epoch": 0.75, "learning_rate": 7.913475126027295e-07, "loss": 1.0552, "step": 24808 }, { "epoch": 0.75, "learning_rate": 7.91169462263463e-07, "loss": 1.0448, "step": 24809 }, { "epoch": 0.75, "learning_rate": 7.909914281914402e-07, "loss": 1.1355, "step": 24810 }, { "epoch": 0.75, "learning_rate": 7.908134103883566e-07, "loss": 1.2018, "step": 24811 }, { "epoch": 0.75, "learning_rate": 7.906354088559054e-07, "loss": 1.1048, "step": 24812 }, { "epoch": 0.75, "learning_rate": 7.904574235957821e-07, "loss": 1.0656, "step": 24813 }, { "epoch": 0.75, "learning_rate": 7.902794546096803e-07, "loss": 1.0304, "step": 24814 }, { "epoch": 0.75, "learning_rate": 7.901015018992958e-07, "loss": 1.0623, "step": 24815 }, { "epoch": 0.75, "learning_rate": 7.899235654663206e-07, "loss": 1.1229, "step": 24816 }, { "epoch": 0.75, "learning_rate": 7.897456453124497e-07, "loss": 1.1682, "step": 24817 }, { "epoch": 0.75, "learning_rate": 7.895677414393762e-07, "loss": 1.1424, "step": 24818 }, { "epoch": 0.75, "learning_rate": 7.893898538487948e-07, "loss": 1.0054, "step": 24819 }, { "epoch": 0.75, "learning_rate": 7.892119825423977e-07, "loss": 1.0709, "step": 24820 }, { "epoch": 0.75, "learning_rate": 7.890341275218783e-07, "loss": 1.0952, "step": 24821 }, { "epoch": 0.75, "learning_rate": 7.888562887889301e-07, "loss": 1.0911, "step": 24822 }, { "epoch": 0.75, "learning_rate": 7.88678466345246e-07, "loss": 1.1238, "step": 24823 }, { "epoch": 0.75, "learning_rate": 7.885006601925194e-07, "loss": 1.0333, "step": 24824 }, { "epoch": 0.75, "learning_rate": 7.883228703324414e-07, "loss": 1.2443, "step": 24825 }, { "epoch": 0.75, "learning_rate": 7.881450967667051e-07, "loss": 1.0118, "step": 24826 }, { "epoch": 0.75, "learning_rate": 7.879673394970034e-07, "loss": 1.1, "step": 24827 }, { "epoch": 0.75, "learning_rate": 7.877895985250286e-07, "loss": 1.1361, "step": 24828 }, { "epoch": 0.75, "learning_rate": 7.876118738524716e-07, "loss": 1.1304, "step": 24829 }, { "epoch": 0.75, "learning_rate": 7.874341654810247e-07, "loss": 1.2027, "step": 24830 }, { "epoch": 0.75, "learning_rate": 7.872564734123797e-07, "loss": 1.0851, "step": 24831 }, { "epoch": 0.75, "learning_rate": 7.870787976482283e-07, "loss": 1.142, "step": 24832 }, { "epoch": 0.75, "learning_rate": 7.869011381902616e-07, "loss": 1.1089, "step": 24833 }, { "epoch": 0.75, "learning_rate": 7.867234950401714e-07, "loss": 1.0687, "step": 24834 }, { "epoch": 0.75, "learning_rate": 7.86545868199648e-07, "loss": 0.9752, "step": 24835 }, { "epoch": 0.75, "learning_rate": 7.863682576703837e-07, "loss": 1.2776, "step": 24836 }, { "epoch": 0.75, "learning_rate": 7.861906634540676e-07, "loss": 1.0105, "step": 24837 }, { "epoch": 0.75, "learning_rate": 7.860130855523906e-07, "loss": 1.2114, "step": 24838 }, { "epoch": 0.75, "learning_rate": 7.858355239670437e-07, "loss": 1.2103, "step": 24839 }, { "epoch": 0.75, "learning_rate": 7.856579786997174e-07, "loss": 1.1058, "step": 24840 }, { "epoch": 0.75, "learning_rate": 7.854804497521018e-07, "loss": 1.168, "step": 24841 }, { "epoch": 0.75, "learning_rate": 7.85302937125886e-07, "loss": 1.136, "step": 24842 }, { "epoch": 0.75, "learning_rate": 7.851254408227604e-07, "loss": 1.1005, "step": 24843 }, { "epoch": 0.75, "learning_rate": 7.849479608444147e-07, "loss": 1.1427, "step": 24844 }, { "epoch": 0.75, "learning_rate": 7.847704971925391e-07, "loss": 1.0336, "step": 24845 }, { "epoch": 0.75, "learning_rate": 7.845930498688214e-07, "loss": 1.1758, "step": 24846 }, { "epoch": 0.75, "learning_rate": 7.844156188749519e-07, "loss": 1.1436, "step": 24847 }, { "epoch": 0.75, "learning_rate": 7.842382042126195e-07, "loss": 1.1625, "step": 24848 }, { "epoch": 0.75, "learning_rate": 7.840608058835139e-07, "loss": 1.0709, "step": 24849 }, { "epoch": 0.75, "learning_rate": 7.838834238893219e-07, "loss": 1.0252, "step": 24850 }, { "epoch": 0.75, "learning_rate": 7.837060582317336e-07, "loss": 1.1369, "step": 24851 }, { "epoch": 0.75, "learning_rate": 7.835287089124366e-07, "loss": 1.0841, "step": 24852 }, { "epoch": 0.75, "learning_rate": 7.833513759331199e-07, "loss": 1.1033, "step": 24853 }, { "epoch": 0.75, "learning_rate": 7.83174059295472e-07, "loss": 1.2079, "step": 24854 }, { "epoch": 0.75, "learning_rate": 7.829967590011794e-07, "loss": 1.1799, "step": 24855 }, { "epoch": 0.75, "learning_rate": 7.828194750519308e-07, "loss": 1.1417, "step": 24856 }, { "epoch": 0.75, "learning_rate": 7.826422074494139e-07, "loss": 1.1572, "step": 24857 }, { "epoch": 0.75, "learning_rate": 7.824649561953157e-07, "loss": 1.2051, "step": 24858 }, { "epoch": 0.75, "learning_rate": 7.822877212913243e-07, "loss": 0.9704, "step": 24859 }, { "epoch": 0.75, "learning_rate": 7.821105027391262e-07, "loss": 1.0507, "step": 24860 }, { "epoch": 0.75, "learning_rate": 7.819333005404089e-07, "loss": 1.1336, "step": 24861 }, { "epoch": 0.75, "learning_rate": 7.8175611469686e-07, "loss": 1.0944, "step": 24862 }, { "epoch": 0.75, "learning_rate": 7.815789452101647e-07, "loss": 1.183, "step": 24863 }, { "epoch": 0.75, "learning_rate": 7.814017920820099e-07, "loss": 1.1011, "step": 24864 }, { "epoch": 0.75, "learning_rate": 7.812246553140824e-07, "loss": 1.0948, "step": 24865 }, { "epoch": 0.75, "learning_rate": 7.810475349080684e-07, "loss": 1.1147, "step": 24866 }, { "epoch": 0.75, "learning_rate": 7.808704308656548e-07, "loss": 1.1943, "step": 24867 }, { "epoch": 0.75, "learning_rate": 7.806933431885261e-07, "loss": 1.152, "step": 24868 }, { "epoch": 0.75, "learning_rate": 7.805162718783684e-07, "loss": 1.0581, "step": 24869 }, { "epoch": 0.75, "learning_rate": 7.803392169368679e-07, "loss": 1.183, "step": 24870 }, { "epoch": 0.75, "learning_rate": 7.801621783657107e-07, "loss": 1.1246, "step": 24871 }, { "epoch": 0.75, "learning_rate": 7.799851561665802e-07, "loss": 1.1357, "step": 24872 }, { "epoch": 0.75, "learning_rate": 7.798081503411628e-07, "loss": 1.0236, "step": 24873 }, { "epoch": 0.75, "learning_rate": 7.796311608911433e-07, "loss": 1.201, "step": 24874 }, { "epoch": 0.75, "learning_rate": 7.794541878182074e-07, "loss": 1.1196, "step": 24875 }, { "epoch": 0.75, "learning_rate": 7.792772311240382e-07, "loss": 1.052, "step": 24876 }, { "epoch": 0.75, "learning_rate": 7.791002908103209e-07, "loss": 1.1185, "step": 24877 }, { "epoch": 0.75, "learning_rate": 7.789233668787402e-07, "loss": 1.1141, "step": 24878 }, { "epoch": 0.75, "learning_rate": 7.787464593309802e-07, "loss": 1.0453, "step": 24879 }, { "epoch": 0.75, "learning_rate": 7.785695681687256e-07, "loss": 1.1324, "step": 24880 }, { "epoch": 0.75, "learning_rate": 7.783926933936589e-07, "loss": 1.1254, "step": 24881 }, { "epoch": 0.75, "learning_rate": 7.782158350074646e-07, "loss": 1.0955, "step": 24882 }, { "epoch": 0.75, "learning_rate": 7.780389930118263e-07, "loss": 1.0503, "step": 24883 }, { "epoch": 0.75, "learning_rate": 7.778621674084275e-07, "loss": 0.9386, "step": 24884 }, { "epoch": 0.75, "learning_rate": 7.776853581989513e-07, "loss": 1.1751, "step": 24885 }, { "epoch": 0.75, "learning_rate": 7.775085653850811e-07, "loss": 1.2206, "step": 24886 }, { "epoch": 0.75, "learning_rate": 7.773317889684998e-07, "loss": 1.1118, "step": 24887 }, { "epoch": 0.75, "learning_rate": 7.771550289508908e-07, "loss": 0.9788, "step": 24888 }, { "epoch": 0.75, "learning_rate": 7.769782853339356e-07, "loss": 1.0781, "step": 24889 }, { "epoch": 0.75, "learning_rate": 7.768015581193173e-07, "loss": 1.1593, "step": 24890 }, { "epoch": 0.75, "learning_rate": 7.766248473087179e-07, "loss": 1.0792, "step": 24891 }, { "epoch": 0.75, "learning_rate": 7.764481529038203e-07, "loss": 1.0192, "step": 24892 }, { "epoch": 0.75, "learning_rate": 7.762714749063069e-07, "loss": 1.1699, "step": 24893 }, { "epoch": 0.75, "learning_rate": 7.760948133178581e-07, "loss": 1.2204, "step": 24894 }, { "epoch": 0.75, "learning_rate": 7.759181681401564e-07, "loss": 1.1696, "step": 24895 }, { "epoch": 0.75, "learning_rate": 7.757415393748835e-07, "loss": 1.0314, "step": 24896 }, { "epoch": 0.75, "learning_rate": 7.755649270237214e-07, "loss": 1.0972, "step": 24897 }, { "epoch": 0.75, "learning_rate": 7.753883310883498e-07, "loss": 1.0564, "step": 24898 }, { "epoch": 0.75, "learning_rate": 7.752117515704507e-07, "loss": 1.062, "step": 24899 }, { "epoch": 0.75, "learning_rate": 7.750351884717053e-07, "loss": 1.2058, "step": 24900 }, { "epoch": 0.75, "learning_rate": 7.748586417937948e-07, "loss": 1.096, "step": 24901 }, { "epoch": 0.75, "learning_rate": 7.746821115383982e-07, "loss": 1.1099, "step": 24902 }, { "epoch": 0.75, "learning_rate": 7.745055977071972e-07, "loss": 1.0604, "step": 24903 }, { "epoch": 0.75, "learning_rate": 7.743291003018716e-07, "loss": 1.1945, "step": 24904 }, { "epoch": 0.75, "learning_rate": 7.741526193241022e-07, "loss": 1.0536, "step": 24905 }, { "epoch": 0.75, "learning_rate": 7.739761547755692e-07, "loss": 1.1153, "step": 24906 }, { "epoch": 0.75, "learning_rate": 7.737997066579512e-07, "loss": 1.2324, "step": 24907 }, { "epoch": 0.75, "learning_rate": 7.736232749729287e-07, "loss": 1.1049, "step": 24908 }, { "epoch": 0.75, "learning_rate": 7.734468597221812e-07, "loss": 0.9598, "step": 24909 }, { "epoch": 0.75, "learning_rate": 7.732704609073885e-07, "loss": 1.1047, "step": 24910 }, { "epoch": 0.75, "learning_rate": 7.73094078530229e-07, "loss": 1.1052, "step": 24911 }, { "epoch": 0.75, "learning_rate": 7.72917712592382e-07, "loss": 1.2242, "step": 24912 }, { "epoch": 0.75, "learning_rate": 7.727413630955266e-07, "loss": 1.046, "step": 24913 }, { "epoch": 0.75, "learning_rate": 7.725650300413415e-07, "loss": 1.053, "step": 24914 }, { "epoch": 0.75, "learning_rate": 7.723887134315055e-07, "loss": 1.0418, "step": 24915 }, { "epoch": 0.75, "learning_rate": 7.722124132676967e-07, "loss": 1.1447, "step": 24916 }, { "epoch": 0.75, "learning_rate": 7.720361295515937e-07, "loss": 1.1209, "step": 24917 }, { "epoch": 0.75, "learning_rate": 7.718598622848747e-07, "loss": 1.0554, "step": 24918 }, { "epoch": 0.75, "learning_rate": 7.71683611469218e-07, "loss": 1.2069, "step": 24919 }, { "epoch": 0.75, "learning_rate": 7.715073771063003e-07, "loss": 1.1453, "step": 24920 }, { "epoch": 0.75, "learning_rate": 7.713311591977999e-07, "loss": 1.0656, "step": 24921 }, { "epoch": 0.75, "learning_rate": 7.711549577453945e-07, "loss": 1.0496, "step": 24922 }, { "epoch": 0.75, "learning_rate": 7.709787727507617e-07, "loss": 1.1512, "step": 24923 }, { "epoch": 0.75, "learning_rate": 7.708026042155775e-07, "loss": 1.158, "step": 24924 }, { "epoch": 0.75, "learning_rate": 7.706264521415199e-07, "loss": 1.1022, "step": 24925 }, { "epoch": 0.75, "learning_rate": 7.704503165302654e-07, "loss": 1.1036, "step": 24926 }, { "epoch": 0.75, "learning_rate": 7.702741973834918e-07, "loss": 1.1066, "step": 24927 }, { "epoch": 0.75, "learning_rate": 7.700980947028741e-07, "loss": 1.1717, "step": 24928 }, { "epoch": 0.75, "learning_rate": 7.699220084900891e-07, "loss": 1.1087, "step": 24929 }, { "epoch": 0.75, "learning_rate": 7.697459387468137e-07, "loss": 1.1228, "step": 24930 }, { "epoch": 0.75, "learning_rate": 7.695698854747232e-07, "loss": 0.9747, "step": 24931 }, { "epoch": 0.75, "learning_rate": 7.693938486754951e-07, "loss": 1.0373, "step": 24932 }, { "epoch": 0.75, "learning_rate": 7.692178283508034e-07, "loss": 1.04, "step": 24933 }, { "epoch": 0.75, "learning_rate": 7.690418245023241e-07, "loss": 1.1186, "step": 24934 }, { "epoch": 0.75, "learning_rate": 7.688658371317331e-07, "loss": 1.0955, "step": 24935 }, { "epoch": 0.75, "learning_rate": 7.686898662407064e-07, "loss": 1.1151, "step": 24936 }, { "epoch": 0.75, "learning_rate": 7.685139118309173e-07, "loss": 1.2408, "step": 24937 }, { "epoch": 0.75, "learning_rate": 7.683379739040422e-07, "loss": 0.9514, "step": 24938 }, { "epoch": 0.75, "learning_rate": 7.681620524617556e-07, "loss": 1.1348, "step": 24939 }, { "epoch": 0.75, "learning_rate": 7.679861475057319e-07, "loss": 1.0197, "step": 24940 }, { "epoch": 0.75, "learning_rate": 7.67810259037646e-07, "loss": 1.0432, "step": 24941 }, { "epoch": 0.75, "learning_rate": 7.676343870591723e-07, "loss": 1.1106, "step": 24942 }, { "epoch": 0.75, "learning_rate": 7.674585315719848e-07, "loss": 1.181, "step": 24943 }, { "epoch": 0.75, "learning_rate": 7.672826925777576e-07, "loss": 1.1111, "step": 24944 }, { "epoch": 0.75, "learning_rate": 7.671068700781655e-07, "loss": 1.1812, "step": 24945 }, { "epoch": 0.75, "learning_rate": 7.669310640748808e-07, "loss": 1.152, "step": 24946 }, { "epoch": 0.75, "learning_rate": 7.667552745695775e-07, "loss": 1.0615, "step": 24947 }, { "epoch": 0.75, "learning_rate": 7.665795015639293e-07, "loss": 1.1146, "step": 24948 }, { "epoch": 0.75, "learning_rate": 7.664037450596102e-07, "loss": 1.1119, "step": 24949 }, { "epoch": 0.75, "learning_rate": 7.662280050582916e-07, "loss": 1.167, "step": 24950 }, { "epoch": 0.75, "learning_rate": 7.660522815616475e-07, "loss": 1.0126, "step": 24951 }, { "epoch": 0.75, "learning_rate": 7.658765745713506e-07, "loss": 1.0218, "step": 24952 }, { "epoch": 0.75, "learning_rate": 7.657008840890743e-07, "loss": 0.9902, "step": 24953 }, { "epoch": 0.75, "learning_rate": 7.655252101164895e-07, "loss": 1.2236, "step": 24954 }, { "epoch": 0.75, "learning_rate": 7.653495526552693e-07, "loss": 1.1389, "step": 24955 }, { "epoch": 0.75, "learning_rate": 7.651739117070859e-07, "loss": 1.1033, "step": 24956 }, { "epoch": 0.75, "learning_rate": 7.649982872736115e-07, "loss": 1.1358, "step": 24957 }, { "epoch": 0.75, "learning_rate": 7.648226793565184e-07, "loss": 1.0772, "step": 24958 }, { "epoch": 0.75, "learning_rate": 7.646470879574771e-07, "loss": 1.0408, "step": 24959 }, { "epoch": 0.75, "learning_rate": 7.644715130781596e-07, "loss": 1.0389, "step": 24960 }, { "epoch": 0.75, "learning_rate": 7.642959547202375e-07, "loss": 1.1245, "step": 24961 }, { "epoch": 0.75, "learning_rate": 7.641204128853827e-07, "loss": 1.2321, "step": 24962 }, { "epoch": 0.75, "learning_rate": 7.639448875752647e-07, "loss": 1.0616, "step": 24963 }, { "epoch": 0.75, "learning_rate": 7.637693787915553e-07, "loss": 1.0983, "step": 24964 }, { "epoch": 0.75, "learning_rate": 7.635938865359255e-07, "loss": 1.1172, "step": 24965 }, { "epoch": 0.75, "learning_rate": 7.634184108100454e-07, "loss": 1.0328, "step": 24966 }, { "epoch": 0.75, "learning_rate": 7.632429516155856e-07, "loss": 1.1804, "step": 24967 }, { "epoch": 0.75, "learning_rate": 7.630675089542166e-07, "loss": 1.1219, "step": 24968 }, { "epoch": 0.75, "learning_rate": 7.628920828276082e-07, "loss": 1.0021, "step": 24969 }, { "epoch": 0.75, "learning_rate": 7.627166732374313e-07, "loss": 1.0443, "step": 24970 }, { "epoch": 0.75, "learning_rate": 7.625412801853543e-07, "loss": 1.0828, "step": 24971 }, { "epoch": 0.75, "learning_rate": 7.623659036730477e-07, "loss": 1.0236, "step": 24972 }, { "epoch": 0.75, "learning_rate": 7.621905437021807e-07, "loss": 1.0523, "step": 24973 }, { "epoch": 0.75, "learning_rate": 7.620152002744227e-07, "loss": 1.1001, "step": 24974 }, { "epoch": 0.75, "learning_rate": 7.618398733914436e-07, "loss": 0.9911, "step": 24975 }, { "epoch": 0.75, "learning_rate": 7.616645630549113e-07, "loss": 1.1995, "step": 24976 }, { "epoch": 0.75, "learning_rate": 7.61489269266495e-07, "loss": 1.1721, "step": 24977 }, { "epoch": 0.75, "learning_rate": 7.613139920278634e-07, "loss": 0.9987, "step": 24978 }, { "epoch": 0.75, "learning_rate": 7.611387313406862e-07, "loss": 1.1116, "step": 24979 }, { "epoch": 0.75, "learning_rate": 7.609634872066302e-07, "loss": 1.2054, "step": 24980 }, { "epoch": 0.75, "learning_rate": 7.607882596273639e-07, "loss": 1.1457, "step": 24981 }, { "epoch": 0.75, "learning_rate": 7.60613048604556e-07, "loss": 1.1085, "step": 24982 }, { "epoch": 0.75, "learning_rate": 7.604378541398738e-07, "loss": 1.0492, "step": 24983 }, { "epoch": 0.75, "learning_rate": 7.602626762349866e-07, "loss": 0.9958, "step": 24984 }, { "epoch": 0.75, "learning_rate": 7.600875148915598e-07, "loss": 1.0657, "step": 24985 }, { "epoch": 0.75, "learning_rate": 7.59912370111262e-07, "loss": 1.2122, "step": 24986 }, { "epoch": 0.75, "learning_rate": 7.597372418957605e-07, "loss": 1.1119, "step": 24987 }, { "epoch": 0.75, "learning_rate": 7.59562130246723e-07, "loss": 1.1733, "step": 24988 }, { "epoch": 0.75, "learning_rate": 7.593870351658147e-07, "loss": 1.0695, "step": 24989 }, { "epoch": 0.75, "learning_rate": 7.592119566547041e-07, "loss": 1.0836, "step": 24990 }, { "epoch": 0.75, "learning_rate": 7.59036894715057e-07, "loss": 1.1548, "step": 24991 }, { "epoch": 0.75, "learning_rate": 7.588618493485409e-07, "loss": 1.2042, "step": 24992 }, { "epoch": 0.75, "learning_rate": 7.586868205568207e-07, "loss": 0.9882, "step": 24993 }, { "epoch": 0.75, "learning_rate": 7.585118083415633e-07, "loss": 1.02, "step": 24994 }, { "epoch": 0.75, "learning_rate": 7.583368127044347e-07, "loss": 1.0486, "step": 24995 }, { "epoch": 0.75, "learning_rate": 7.581618336471008e-07, "loss": 1.1329, "step": 24996 }, { "epoch": 0.75, "learning_rate": 7.579868711712276e-07, "loss": 1.1505, "step": 24997 }, { "epoch": 0.75, "learning_rate": 7.578119252784802e-07, "loss": 1.1121, "step": 24998 }, { "epoch": 0.75, "learning_rate": 7.576369959705243e-07, "loss": 1.0737, "step": 24999 }, { "epoch": 0.75, "learning_rate": 7.574620832490251e-07, "loss": 1.1586, "step": 25000 }, { "epoch": 0.75, "learning_rate": 7.572871871156481e-07, "loss": 1.1637, "step": 25001 }, { "epoch": 0.75, "learning_rate": 7.571123075720573e-07, "loss": 1.0022, "step": 25002 }, { "epoch": 0.75, "learning_rate": 7.569374446199179e-07, "loss": 1.0546, "step": 25003 }, { "epoch": 0.75, "learning_rate": 7.567625982608945e-07, "loss": 1.1211, "step": 25004 }, { "epoch": 0.75, "learning_rate": 7.565877684966521e-07, "loss": 1.2648, "step": 25005 }, { "epoch": 0.75, "learning_rate": 7.56412955328854e-07, "loss": 1.1445, "step": 25006 }, { "epoch": 0.75, "learning_rate": 7.562381587591649e-07, "loss": 1.1593, "step": 25007 }, { "epoch": 0.75, "learning_rate": 7.560633787892486e-07, "loss": 1.1064, "step": 25008 }, { "epoch": 0.75, "learning_rate": 7.558886154207698e-07, "loss": 1.0201, "step": 25009 }, { "epoch": 0.75, "learning_rate": 7.557138686553905e-07, "loss": 1.1274, "step": 25010 }, { "epoch": 0.75, "learning_rate": 7.555391384947752e-07, "loss": 1.163, "step": 25011 }, { "epoch": 0.75, "learning_rate": 7.553644249405872e-07, "loss": 1.0932, "step": 25012 }, { "epoch": 0.75, "learning_rate": 7.551897279944895e-07, "loss": 1.131, "step": 25013 }, { "epoch": 0.75, "learning_rate": 7.550150476581461e-07, "loss": 1.0451, "step": 25014 }, { "epoch": 0.75, "learning_rate": 7.548403839332182e-07, "loss": 1.1047, "step": 25015 }, { "epoch": 0.75, "learning_rate": 7.546657368213695e-07, "loss": 1.042, "step": 25016 }, { "epoch": 0.75, "learning_rate": 7.544911063242622e-07, "loss": 1.0703, "step": 25017 }, { "epoch": 0.75, "learning_rate": 7.543164924435597e-07, "loss": 1.1434, "step": 25018 }, { "epoch": 0.75, "learning_rate": 7.541418951809229e-07, "loss": 1.0213, "step": 25019 }, { "epoch": 0.75, "learning_rate": 7.539673145380142e-07, "loss": 1.0726, "step": 25020 }, { "epoch": 0.75, "learning_rate": 7.537927505164958e-07, "loss": 1.1401, "step": 25021 }, { "epoch": 0.75, "learning_rate": 7.536182031180294e-07, "loss": 1.0329, "step": 25022 }, { "epoch": 0.75, "learning_rate": 7.534436723442767e-07, "loss": 1.0901, "step": 25023 }, { "epoch": 0.75, "learning_rate": 7.53269158196899e-07, "loss": 1.0142, "step": 25024 }, { "epoch": 0.75, "learning_rate": 7.530946606775577e-07, "loss": 1.1311, "step": 25025 }, { "epoch": 0.75, "learning_rate": 7.529201797879138e-07, "loss": 1.1433, "step": 25026 }, { "epoch": 0.75, "learning_rate": 7.527457155296292e-07, "loss": 1.0941, "step": 25027 }, { "epoch": 0.75, "learning_rate": 7.525712679043632e-07, "loss": 1.0487, "step": 25028 }, { "epoch": 0.75, "learning_rate": 7.523968369137771e-07, "loss": 1.1367, "step": 25029 }, { "epoch": 0.75, "learning_rate": 7.522224225595312e-07, "loss": 1.1879, "step": 25030 }, { "epoch": 0.75, "learning_rate": 7.52048024843287e-07, "loss": 1.0931, "step": 25031 }, { "epoch": 0.75, "learning_rate": 7.518736437667032e-07, "loss": 1.1278, "step": 25032 }, { "epoch": 0.75, "learning_rate": 7.516992793314401e-07, "loss": 1.071, "step": 25033 }, { "epoch": 0.75, "learning_rate": 7.515249315391582e-07, "loss": 1.1661, "step": 25034 }, { "epoch": 0.75, "learning_rate": 7.513506003915172e-07, "loss": 1.0516, "step": 25035 }, { "epoch": 0.75, "learning_rate": 7.511762858901758e-07, "loss": 1.1275, "step": 25036 }, { "epoch": 0.75, "learning_rate": 7.510019880367938e-07, "loss": 1.1968, "step": 25037 }, { "epoch": 0.75, "learning_rate": 7.508277068330305e-07, "loss": 1.0926, "step": 25038 }, { "epoch": 0.75, "learning_rate": 7.50653442280545e-07, "loss": 1.027, "step": 25039 }, { "epoch": 0.75, "learning_rate": 7.504791943809972e-07, "loss": 0.9621, "step": 25040 }, { "epoch": 0.75, "learning_rate": 7.50304963136044e-07, "loss": 1.0947, "step": 25041 }, { "epoch": 0.75, "learning_rate": 7.501307485473447e-07, "loss": 1.1658, "step": 25042 }, { "epoch": 0.75, "learning_rate": 7.499565506165579e-07, "loss": 1.0768, "step": 25043 }, { "epoch": 0.75, "learning_rate": 7.49782369345343e-07, "loss": 0.8148, "step": 25044 }, { "epoch": 0.75, "learning_rate": 7.496082047353559e-07, "loss": 1.1536, "step": 25045 }, { "epoch": 0.75, "learning_rate": 7.494340567882558e-07, "loss": 0.9993, "step": 25046 }, { "epoch": 0.75, "learning_rate": 7.492599255057003e-07, "loss": 0.9699, "step": 25047 }, { "epoch": 0.75, "learning_rate": 7.490858108893473e-07, "loss": 1.0647, "step": 25048 }, { "epoch": 0.75, "learning_rate": 7.489117129408541e-07, "loss": 1.1519, "step": 25049 }, { "epoch": 0.75, "learning_rate": 7.487376316618777e-07, "loss": 1.0414, "step": 25050 }, { "epoch": 0.75, "learning_rate": 7.485635670540759e-07, "loss": 1.1286, "step": 25051 }, { "epoch": 0.75, "learning_rate": 7.483895191191063e-07, "loss": 1.1069, "step": 25052 }, { "epoch": 0.75, "learning_rate": 7.48215487858624e-07, "loss": 1.0842, "step": 25053 }, { "epoch": 0.75, "learning_rate": 7.480414732742864e-07, "loss": 1.0475, "step": 25054 }, { "epoch": 0.75, "learning_rate": 7.478674753677503e-07, "loss": 1.0565, "step": 25055 }, { "epoch": 0.75, "learning_rate": 7.476934941406719e-07, "loss": 1.1009, "step": 25056 }, { "epoch": 0.75, "learning_rate": 7.475195295947086e-07, "loss": 1.191, "step": 25057 }, { "epoch": 0.75, "learning_rate": 7.473455817315143e-07, "loss": 1.0286, "step": 25058 }, { "epoch": 0.75, "learning_rate": 7.47171650552746e-07, "loss": 1.1489, "step": 25059 }, { "epoch": 0.75, "learning_rate": 7.469977360600595e-07, "loss": 1.0952, "step": 25060 }, { "epoch": 0.75, "learning_rate": 7.468238382551107e-07, "loss": 1.12, "step": 25061 }, { "epoch": 0.75, "learning_rate": 7.466499571395541e-07, "loss": 1.0449, "step": 25062 }, { "epoch": 0.76, "learning_rate": 7.464760927150455e-07, "loss": 1.0712, "step": 25063 }, { "epoch": 0.76, "learning_rate": 7.463022449832399e-07, "loss": 1.082, "step": 25064 }, { "epoch": 0.76, "learning_rate": 7.461284139457922e-07, "loss": 0.9741, "step": 25065 }, { "epoch": 0.76, "learning_rate": 7.459545996043582e-07, "loss": 1.093, "step": 25066 }, { "epoch": 0.76, "learning_rate": 7.457808019605911e-07, "loss": 1.1259, "step": 25067 }, { "epoch": 0.76, "learning_rate": 7.456070210161457e-07, "loss": 1.0574, "step": 25068 }, { "epoch": 0.76, "learning_rate": 7.454332567726763e-07, "loss": 1.1185, "step": 25069 }, { "epoch": 0.76, "learning_rate": 7.452595092318382e-07, "loss": 1.0558, "step": 25070 }, { "epoch": 0.76, "learning_rate": 7.450857783952839e-07, "loss": 1.0732, "step": 25071 }, { "epoch": 0.76, "learning_rate": 7.449120642646676e-07, "loss": 1.1228, "step": 25072 }, { "epoch": 0.76, "learning_rate": 7.44738366841643e-07, "loss": 0.9308, "step": 25073 }, { "epoch": 0.76, "learning_rate": 7.44564686127865e-07, "loss": 1.0729, "step": 25074 }, { "epoch": 0.76, "learning_rate": 7.443910221249844e-07, "loss": 1.2286, "step": 25075 }, { "epoch": 0.76, "learning_rate": 7.442173748346562e-07, "loss": 1.0263, "step": 25076 }, { "epoch": 0.76, "learning_rate": 7.440437442585327e-07, "loss": 1.1606, "step": 25077 }, { "epoch": 0.76, "learning_rate": 7.438701303982673e-07, "loss": 1.0417, "step": 25078 }, { "epoch": 0.76, "learning_rate": 7.436965332555124e-07, "loss": 1.1358, "step": 25079 }, { "epoch": 0.76, "learning_rate": 7.435229528319204e-07, "loss": 1.1507, "step": 25080 }, { "epoch": 0.76, "learning_rate": 7.433493891291443e-07, "loss": 1.0723, "step": 25081 }, { "epoch": 0.76, "learning_rate": 7.431758421488358e-07, "loss": 1.1104, "step": 25082 }, { "epoch": 0.76, "learning_rate": 7.430023118926479e-07, "loss": 1.1275, "step": 25083 }, { "epoch": 0.76, "learning_rate": 7.428287983622312e-07, "loss": 1.1332, "step": 25084 }, { "epoch": 0.76, "learning_rate": 7.426553015592378e-07, "loss": 1.1539, "step": 25085 }, { "epoch": 0.76, "learning_rate": 7.424818214853197e-07, "loss": 1.1644, "step": 25086 }, { "epoch": 0.76, "learning_rate": 7.42308358142129e-07, "loss": 1.0713, "step": 25087 }, { "epoch": 0.76, "learning_rate": 7.421349115313154e-07, "loss": 1.0882, "step": 25088 }, { "epoch": 0.76, "learning_rate": 7.419614816545309e-07, "loss": 1.0635, "step": 25089 }, { "epoch": 0.76, "learning_rate": 7.417880685134262e-07, "loss": 1.1925, "step": 25090 }, { "epoch": 0.76, "learning_rate": 7.416146721096526e-07, "loss": 1.0105, "step": 25091 }, { "epoch": 0.76, "learning_rate": 7.41441292444861e-07, "loss": 1.2369, "step": 25092 }, { "epoch": 0.76, "learning_rate": 7.412679295207006e-07, "loss": 1.1505, "step": 25093 }, { "epoch": 0.76, "learning_rate": 7.410945833388225e-07, "loss": 1.1099, "step": 25094 }, { "epoch": 0.76, "learning_rate": 7.40921253900877e-07, "loss": 1.1065, "step": 25095 }, { "epoch": 0.76, "learning_rate": 7.407479412085144e-07, "loss": 1.1423, "step": 25096 }, { "epoch": 0.76, "learning_rate": 7.405746452633836e-07, "loss": 1.0788, "step": 25097 }, { "epoch": 0.76, "learning_rate": 7.404013660671347e-07, "loss": 1.0241, "step": 25098 }, { "epoch": 0.76, "learning_rate": 7.402281036214174e-07, "loss": 1.2057, "step": 25099 }, { "epoch": 0.76, "learning_rate": 7.400548579278819e-07, "loss": 1.1729, "step": 25100 }, { "epoch": 0.76, "learning_rate": 7.398816289881755e-07, "loss": 1.069, "step": 25101 }, { "epoch": 0.76, "learning_rate": 7.397084168039484e-07, "loss": 1.0577, "step": 25102 }, { "epoch": 0.76, "learning_rate": 7.395352213768495e-07, "loss": 0.9996, "step": 25103 }, { "epoch": 0.76, "learning_rate": 7.393620427085271e-07, "loss": 1.1286, "step": 25104 }, { "epoch": 0.76, "learning_rate": 7.391888808006306e-07, "loss": 1.1636, "step": 25105 }, { "epoch": 0.76, "learning_rate": 7.390157356548074e-07, "loss": 1.2307, "step": 25106 }, { "epoch": 0.76, "learning_rate": 7.388426072727067e-07, "loss": 1.1257, "step": 25107 }, { "epoch": 0.76, "learning_rate": 7.386694956559759e-07, "loss": 1.2163, "step": 25108 }, { "epoch": 0.76, "learning_rate": 7.384964008062643e-07, "loss": 1.0378, "step": 25109 }, { "epoch": 0.76, "learning_rate": 7.383233227252176e-07, "loss": 0.9921, "step": 25110 }, { "epoch": 0.76, "learning_rate": 7.381502614144842e-07, "loss": 1.1212, "step": 25111 }, { "epoch": 0.76, "learning_rate": 7.379772168757121e-07, "loss": 1.2079, "step": 25112 }, { "epoch": 0.76, "learning_rate": 7.378041891105489e-07, "loss": 1.0554, "step": 25113 }, { "epoch": 0.76, "learning_rate": 7.376311781206405e-07, "loss": 1.1669, "step": 25114 }, { "epoch": 0.76, "learning_rate": 7.374581839076344e-07, "loss": 1.1356, "step": 25115 }, { "epoch": 0.76, "learning_rate": 7.372852064731775e-07, "loss": 1.1002, "step": 25116 }, { "epoch": 0.76, "learning_rate": 7.371122458189165e-07, "loss": 1.1138, "step": 25117 }, { "epoch": 0.76, "learning_rate": 7.369393019464988e-07, "loss": 1.1681, "step": 25118 }, { "epoch": 0.76, "learning_rate": 7.367663748575687e-07, "loss": 1.0128, "step": 25119 }, { "epoch": 0.76, "learning_rate": 7.365934645537737e-07, "loss": 1.1248, "step": 25120 }, { "epoch": 0.76, "learning_rate": 7.364205710367598e-07, "loss": 1.127, "step": 25121 }, { "epoch": 0.76, "learning_rate": 7.362476943081734e-07, "loss": 0.9953, "step": 25122 }, { "epoch": 0.76, "learning_rate": 7.360748343696586e-07, "loss": 1.0829, "step": 25123 }, { "epoch": 0.76, "learning_rate": 7.359019912228618e-07, "loss": 1.1816, "step": 25124 }, { "epoch": 0.76, "learning_rate": 7.357291648694284e-07, "loss": 1.2406, "step": 25125 }, { "epoch": 0.76, "learning_rate": 7.355563553110045e-07, "loss": 1.0854, "step": 25126 }, { "epoch": 0.76, "learning_rate": 7.353835625492337e-07, "loss": 1.0975, "step": 25127 }, { "epoch": 0.76, "learning_rate": 7.352107865857613e-07, "loss": 1.0853, "step": 25128 }, { "epoch": 0.76, "learning_rate": 7.350380274222324e-07, "loss": 1.1816, "step": 25129 }, { "epoch": 0.76, "learning_rate": 7.348652850602914e-07, "loss": 1.1888, "step": 25130 }, { "epoch": 0.76, "learning_rate": 7.346925595015828e-07, "loss": 1.095, "step": 25131 }, { "epoch": 0.76, "learning_rate": 7.345198507477508e-07, "loss": 1.0153, "step": 25132 }, { "epoch": 0.76, "learning_rate": 7.343471588004394e-07, "loss": 1.084, "step": 25133 }, { "epoch": 0.76, "learning_rate": 7.34174483661293e-07, "loss": 0.98, "step": 25134 }, { "epoch": 0.76, "learning_rate": 7.340018253319555e-07, "loss": 1.1421, "step": 25135 }, { "epoch": 0.76, "learning_rate": 7.338291838140695e-07, "loss": 1.1507, "step": 25136 }, { "epoch": 0.76, "learning_rate": 7.336565591092789e-07, "loss": 1.0992, "step": 25137 }, { "epoch": 0.76, "learning_rate": 7.334839512192273e-07, "loss": 1.2504, "step": 25138 }, { "epoch": 0.76, "learning_rate": 7.333113601455585e-07, "loss": 1.0394, "step": 25139 }, { "epoch": 0.76, "learning_rate": 7.331387858899139e-07, "loss": 1.049, "step": 25140 }, { "epoch": 0.76, "learning_rate": 7.329662284539371e-07, "loss": 1.0626, "step": 25141 }, { "epoch": 0.76, "learning_rate": 7.327936878392708e-07, "loss": 1.1845, "step": 25142 }, { "epoch": 0.76, "learning_rate": 7.326211640475572e-07, "loss": 1.1639, "step": 25143 }, { "epoch": 0.76, "learning_rate": 7.324486570804401e-07, "loss": 1.0626, "step": 25144 }, { "epoch": 0.76, "learning_rate": 7.322761669395594e-07, "loss": 1.0649, "step": 25145 }, { "epoch": 0.76, "learning_rate": 7.321036936265585e-07, "loss": 1.1466, "step": 25146 }, { "epoch": 0.76, "learning_rate": 7.31931237143079e-07, "loss": 0.9446, "step": 25147 }, { "epoch": 0.76, "learning_rate": 7.31758797490763e-07, "loss": 1.0657, "step": 25148 }, { "epoch": 0.76, "learning_rate": 7.315863746712512e-07, "loss": 1.1407, "step": 25149 }, { "epoch": 0.76, "learning_rate": 7.314139686861852e-07, "loss": 0.8801, "step": 25150 }, { "epoch": 0.76, "learning_rate": 7.312415795372065e-07, "loss": 1.0413, "step": 25151 }, { "epoch": 0.76, "learning_rate": 7.31069207225957e-07, "loss": 1.0671, "step": 25152 }, { "epoch": 0.76, "learning_rate": 7.308968517540757e-07, "loss": 0.986, "step": 25153 }, { "epoch": 0.76, "learning_rate": 7.307245131232047e-07, "loss": 1.0814, "step": 25154 }, { "epoch": 0.76, "learning_rate": 7.305521913349839e-07, "loss": 1.2462, "step": 25155 }, { "epoch": 0.76, "learning_rate": 7.303798863910542e-07, "loss": 1.1226, "step": 25156 }, { "epoch": 0.76, "learning_rate": 7.302075982930562e-07, "loss": 1.1348, "step": 25157 }, { "epoch": 0.76, "learning_rate": 7.300353270426292e-07, "loss": 1.093, "step": 25158 }, { "epoch": 0.76, "learning_rate": 7.29863072641413e-07, "loss": 1.197, "step": 25159 }, { "epoch": 0.76, "learning_rate": 7.296908350910481e-07, "loss": 1.1575, "step": 25160 }, { "epoch": 0.76, "learning_rate": 7.295186143931738e-07, "loss": 1.0059, "step": 25161 }, { "epoch": 0.76, "learning_rate": 7.293464105494294e-07, "loss": 1.1032, "step": 25162 }, { "epoch": 0.76, "learning_rate": 7.291742235614547e-07, "loss": 1.0034, "step": 25163 }, { "epoch": 0.76, "learning_rate": 7.290020534308884e-07, "loss": 1.1169, "step": 25164 }, { "epoch": 0.76, "learning_rate": 7.288299001593702e-07, "loss": 1.1741, "step": 25165 }, { "epoch": 0.76, "learning_rate": 7.286577637485378e-07, "loss": 0.9876, "step": 25166 }, { "epoch": 0.76, "learning_rate": 7.284856442000301e-07, "loss": 1.0972, "step": 25167 }, { "epoch": 0.76, "learning_rate": 7.283135415154863e-07, "loss": 1.2152, "step": 25168 }, { "epoch": 0.76, "learning_rate": 7.281414556965441e-07, "loss": 1.1041, "step": 25169 }, { "epoch": 0.76, "learning_rate": 7.279693867448426e-07, "loss": 1.0753, "step": 25170 }, { "epoch": 0.76, "learning_rate": 7.277973346620182e-07, "loss": 1.0982, "step": 25171 }, { "epoch": 0.76, "learning_rate": 7.276252994497099e-07, "loss": 1.0354, "step": 25172 }, { "epoch": 0.76, "learning_rate": 7.27453281109555e-07, "loss": 1.0811, "step": 25173 }, { "epoch": 0.76, "learning_rate": 7.272812796431922e-07, "loss": 1.0165, "step": 25174 }, { "epoch": 0.76, "learning_rate": 7.271092950522568e-07, "loss": 1.0898, "step": 25175 }, { "epoch": 0.76, "learning_rate": 7.26937327338387e-07, "loss": 1.0942, "step": 25176 }, { "epoch": 0.76, "learning_rate": 7.267653765032201e-07, "loss": 1.1525, "step": 25177 }, { "epoch": 0.76, "learning_rate": 7.265934425483937e-07, "loss": 1.1163, "step": 25178 }, { "epoch": 0.76, "learning_rate": 7.264215254755425e-07, "loss": 1.0231, "step": 25179 }, { "epoch": 0.76, "learning_rate": 7.262496252863044e-07, "loss": 1.2583, "step": 25180 }, { "epoch": 0.76, "learning_rate": 7.260777419823156e-07, "loss": 1.3821, "step": 25181 }, { "epoch": 0.76, "learning_rate": 7.259058755652123e-07, "loss": 1.203, "step": 25182 }, { "epoch": 0.76, "learning_rate": 7.257340260366314e-07, "loss": 0.9813, "step": 25183 }, { "epoch": 0.76, "learning_rate": 7.255621933982074e-07, "loss": 1.0984, "step": 25184 }, { "epoch": 0.76, "learning_rate": 7.253903776515764e-07, "loss": 1.2005, "step": 25185 }, { "epoch": 0.76, "learning_rate": 7.252185787983745e-07, "loss": 1.2299, "step": 25186 }, { "epoch": 0.76, "learning_rate": 7.250467968402372e-07, "loss": 1.1332, "step": 25187 }, { "epoch": 0.76, "learning_rate": 7.248750317787992e-07, "loss": 1.1008, "step": 25188 }, { "epoch": 0.76, "learning_rate": 7.247032836156961e-07, "loss": 1.181, "step": 25189 }, { "epoch": 0.76, "learning_rate": 7.245315523525629e-07, "loss": 1.0833, "step": 25190 }, { "epoch": 0.76, "learning_rate": 7.243598379910349e-07, "loss": 1.0554, "step": 25191 }, { "epoch": 0.76, "learning_rate": 7.241881405327452e-07, "loss": 1.1406, "step": 25192 }, { "epoch": 0.76, "learning_rate": 7.240164599793292e-07, "loss": 1.2582, "step": 25193 }, { "epoch": 0.76, "learning_rate": 7.238447963324211e-07, "loss": 1.0358, "step": 25194 }, { "epoch": 0.76, "learning_rate": 7.236731495936558e-07, "loss": 1.1735, "step": 25195 }, { "epoch": 0.76, "learning_rate": 7.235015197646661e-07, "loss": 1.1197, "step": 25196 }, { "epoch": 0.76, "learning_rate": 7.233299068470862e-07, "loss": 1.0804, "step": 25197 }, { "epoch": 0.76, "learning_rate": 7.231583108425499e-07, "loss": 1.1007, "step": 25198 }, { "epoch": 0.76, "learning_rate": 7.229867317526907e-07, "loss": 1.2651, "step": 25199 }, { "epoch": 0.76, "learning_rate": 7.228151695791427e-07, "loss": 1.1578, "step": 25200 }, { "epoch": 0.76, "learning_rate": 7.226436243235377e-07, "loss": 1.0679, "step": 25201 }, { "epoch": 0.76, "learning_rate": 7.224720959875095e-07, "loss": 1.1376, "step": 25202 }, { "epoch": 0.76, "learning_rate": 7.223005845726908e-07, "loss": 1.0665, "step": 25203 }, { "epoch": 0.76, "learning_rate": 7.221290900807148e-07, "loss": 1.1171, "step": 25204 }, { "epoch": 0.76, "learning_rate": 7.219576125132132e-07, "loss": 1.2402, "step": 25205 }, { "epoch": 0.76, "learning_rate": 7.217861518718189e-07, "loss": 1.1218, "step": 25206 }, { "epoch": 0.76, "learning_rate": 7.216147081581637e-07, "loss": 1.0962, "step": 25207 }, { "epoch": 0.76, "learning_rate": 7.214432813738808e-07, "loss": 1.11, "step": 25208 }, { "epoch": 0.76, "learning_rate": 7.212718715206008e-07, "loss": 1.1891, "step": 25209 }, { "epoch": 0.76, "learning_rate": 7.211004785999557e-07, "loss": 1.0124, "step": 25210 }, { "epoch": 0.76, "learning_rate": 7.20929102613577e-07, "loss": 1.1023, "step": 25211 }, { "epoch": 0.76, "learning_rate": 7.207577435630969e-07, "loss": 1.1013, "step": 25212 }, { "epoch": 0.76, "learning_rate": 7.20586401450146e-07, "loss": 1.142, "step": 25213 }, { "epoch": 0.76, "learning_rate": 7.204150762763554e-07, "loss": 1.1627, "step": 25214 }, { "epoch": 0.76, "learning_rate": 7.202437680433563e-07, "loss": 1.0724, "step": 25215 }, { "epoch": 0.76, "learning_rate": 7.200724767527795e-07, "loss": 1.0235, "step": 25216 }, { "epoch": 0.76, "learning_rate": 7.19901202406256e-07, "loss": 1.0795, "step": 25217 }, { "epoch": 0.76, "learning_rate": 7.197299450054151e-07, "loss": 1.109, "step": 25218 }, { "epoch": 0.76, "learning_rate": 7.195587045518879e-07, "loss": 1.0911, "step": 25219 }, { "epoch": 0.76, "learning_rate": 7.193874810473042e-07, "loss": 1.1194, "step": 25220 }, { "epoch": 0.76, "learning_rate": 7.192162744932948e-07, "loss": 1.0822, "step": 25221 }, { "epoch": 0.76, "learning_rate": 7.190450848914882e-07, "loss": 1.1883, "step": 25222 }, { "epoch": 0.76, "learning_rate": 7.188739122435143e-07, "loss": 1.0734, "step": 25223 }, { "epoch": 0.76, "learning_rate": 7.187027565510032e-07, "loss": 0.9891, "step": 25224 }, { "epoch": 0.76, "learning_rate": 7.185316178155841e-07, "loss": 1.1508, "step": 25225 }, { "epoch": 0.76, "learning_rate": 7.183604960388866e-07, "loss": 1.1083, "step": 25226 }, { "epoch": 0.76, "learning_rate": 7.181893912225382e-07, "loss": 1.028, "step": 25227 }, { "epoch": 0.76, "learning_rate": 7.18018303368169e-07, "loss": 0.9927, "step": 25228 }, { "epoch": 0.76, "learning_rate": 7.178472324774069e-07, "loss": 1.0609, "step": 25229 }, { "epoch": 0.76, "learning_rate": 7.176761785518818e-07, "loss": 1.1595, "step": 25230 }, { "epoch": 0.76, "learning_rate": 7.175051415932205e-07, "loss": 1.1263, "step": 25231 }, { "epoch": 0.76, "learning_rate": 7.173341216030516e-07, "loss": 1.1317, "step": 25232 }, { "epoch": 0.76, "learning_rate": 7.171631185830033e-07, "loss": 1.024, "step": 25233 }, { "epoch": 0.76, "learning_rate": 7.169921325347043e-07, "loss": 1.0402, "step": 25234 }, { "epoch": 0.76, "learning_rate": 7.168211634597805e-07, "loss": 1.0671, "step": 25235 }, { "epoch": 0.76, "learning_rate": 7.166502113598605e-07, "loss": 1.2133, "step": 25236 }, { "epoch": 0.76, "learning_rate": 7.164792762365719e-07, "loss": 1.2356, "step": 25237 }, { "epoch": 0.76, "learning_rate": 7.163083580915415e-07, "loss": 1.1457, "step": 25238 }, { "epoch": 0.76, "learning_rate": 7.161374569263968e-07, "loss": 1.0732, "step": 25239 }, { "epoch": 0.76, "learning_rate": 7.159665727427639e-07, "loss": 1.0126, "step": 25240 }, { "epoch": 0.76, "learning_rate": 7.157957055422702e-07, "loss": 1.24, "step": 25241 }, { "epoch": 0.76, "learning_rate": 7.156248553265418e-07, "loss": 1.0686, "step": 25242 }, { "epoch": 0.76, "learning_rate": 7.154540220972057e-07, "loss": 1.0547, "step": 25243 }, { "epoch": 0.76, "learning_rate": 7.152832058558875e-07, "loss": 1.1888, "step": 25244 }, { "epoch": 0.76, "learning_rate": 7.15112406604214e-07, "loss": 1.1873, "step": 25245 }, { "epoch": 0.76, "learning_rate": 7.149416243438104e-07, "loss": 1.0382, "step": 25246 }, { "epoch": 0.76, "learning_rate": 7.147708590763036e-07, "loss": 1.0808, "step": 25247 }, { "epoch": 0.76, "learning_rate": 7.146001108033179e-07, "loss": 1.2218, "step": 25248 }, { "epoch": 0.76, "learning_rate": 7.144293795264792e-07, "loss": 1.1727, "step": 25249 }, { "epoch": 0.76, "learning_rate": 7.142586652474129e-07, "loss": 1.086, "step": 25250 }, { "epoch": 0.76, "learning_rate": 7.14087967967744e-07, "loss": 1.1365, "step": 25251 }, { "epoch": 0.76, "learning_rate": 7.139172876890981e-07, "loss": 1.1649, "step": 25252 }, { "epoch": 0.76, "learning_rate": 7.137466244130989e-07, "loss": 1.0543, "step": 25253 }, { "epoch": 0.76, "learning_rate": 7.135759781413714e-07, "loss": 1.0673, "step": 25254 }, { "epoch": 0.76, "learning_rate": 7.134053488755402e-07, "loss": 0.9185, "step": 25255 }, { "epoch": 0.76, "learning_rate": 7.132347366172304e-07, "loss": 1.1273, "step": 25256 }, { "epoch": 0.76, "learning_rate": 7.130641413680648e-07, "loss": 1.0179, "step": 25257 }, { "epoch": 0.76, "learning_rate": 7.128935631296676e-07, "loss": 0.9818, "step": 25258 }, { "epoch": 0.76, "learning_rate": 7.127230019036635e-07, "loss": 0.9666, "step": 25259 }, { "epoch": 0.76, "learning_rate": 7.12552457691676e-07, "loss": 0.9681, "step": 25260 }, { "epoch": 0.76, "learning_rate": 7.123819304953275e-07, "loss": 1.1575, "step": 25261 }, { "epoch": 0.76, "learning_rate": 7.122114203162423e-07, "loss": 1.118, "step": 25262 }, { "epoch": 0.76, "learning_rate": 7.12040927156043e-07, "loss": 1.0901, "step": 25263 }, { "epoch": 0.76, "learning_rate": 7.118704510163532e-07, "loss": 1.0608, "step": 25264 }, { "epoch": 0.76, "learning_rate": 7.116999918987963e-07, "loss": 1.0417, "step": 25265 }, { "epoch": 0.76, "learning_rate": 7.115295498049935e-07, "loss": 1.1707, "step": 25266 }, { "epoch": 0.76, "learning_rate": 7.113591247365678e-07, "loss": 1.1646, "step": 25267 }, { "epoch": 0.76, "learning_rate": 7.11188716695142e-07, "loss": 1.2566, "step": 25268 }, { "epoch": 0.76, "learning_rate": 7.11018325682338e-07, "loss": 1.1605, "step": 25269 }, { "epoch": 0.76, "learning_rate": 7.10847951699778e-07, "loss": 1.1688, "step": 25270 }, { "epoch": 0.76, "learning_rate": 7.106775947490835e-07, "loss": 1.1282, "step": 25271 }, { "epoch": 0.76, "learning_rate": 7.10507254831877e-07, "loss": 1.0486, "step": 25272 }, { "epoch": 0.76, "learning_rate": 7.1033693194978e-07, "loss": 1.1074, "step": 25273 }, { "epoch": 0.76, "learning_rate": 7.10166626104413e-07, "loss": 1.1213, "step": 25274 }, { "epoch": 0.76, "learning_rate": 7.099963372973975e-07, "loss": 1.0876, "step": 25275 }, { "epoch": 0.76, "learning_rate": 7.098260655303549e-07, "loss": 1.1597, "step": 25276 }, { "epoch": 0.76, "learning_rate": 7.096558108049056e-07, "loss": 1.0588, "step": 25277 }, { "epoch": 0.76, "learning_rate": 7.094855731226719e-07, "loss": 1.0157, "step": 25278 }, { "epoch": 0.76, "learning_rate": 7.093153524852725e-07, "loss": 1.1899, "step": 25279 }, { "epoch": 0.76, "learning_rate": 7.091451488943282e-07, "loss": 1.2072, "step": 25280 }, { "epoch": 0.76, "learning_rate": 7.089749623514597e-07, "loss": 1.2053, "step": 25281 }, { "epoch": 0.76, "learning_rate": 7.088047928582878e-07, "loss": 1.075, "step": 25282 }, { "epoch": 0.76, "learning_rate": 7.086346404164307e-07, "loss": 1.2008, "step": 25283 }, { "epoch": 0.76, "learning_rate": 7.084645050275094e-07, "loss": 1.0199, "step": 25284 }, { "epoch": 0.76, "learning_rate": 7.082943866931428e-07, "loss": 1.1638, "step": 25285 }, { "epoch": 0.76, "learning_rate": 7.081242854149517e-07, "loss": 1.1849, "step": 25286 }, { "epoch": 0.76, "learning_rate": 7.079542011945536e-07, "loss": 1.195, "step": 25287 }, { "epoch": 0.76, "learning_rate": 7.077841340335684e-07, "loss": 1.0922, "step": 25288 }, { "epoch": 0.76, "learning_rate": 7.076140839336151e-07, "loss": 1.1291, "step": 25289 }, { "epoch": 0.76, "learning_rate": 7.074440508963124e-07, "loss": 1.0145, "step": 25290 }, { "epoch": 0.76, "learning_rate": 7.072740349232798e-07, "loss": 1.0622, "step": 25291 }, { "epoch": 0.76, "learning_rate": 7.071040360161344e-07, "loss": 1.234, "step": 25292 }, { "epoch": 0.76, "learning_rate": 7.069340541764949e-07, "loss": 1.0767, "step": 25293 }, { "epoch": 0.76, "learning_rate": 7.067640894059796e-07, "loss": 1.1444, "step": 25294 }, { "epoch": 0.76, "learning_rate": 7.065941417062067e-07, "loss": 1.171, "step": 25295 }, { "epoch": 0.76, "learning_rate": 7.064242110787936e-07, "loss": 1.1671, "step": 25296 }, { "epoch": 0.76, "learning_rate": 7.062542975253584e-07, "loss": 1.0009, "step": 25297 }, { "epoch": 0.76, "learning_rate": 7.060844010475182e-07, "loss": 1.1837, "step": 25298 }, { "epoch": 0.76, "learning_rate": 7.059145216468916e-07, "loss": 1.182, "step": 25299 }, { "epoch": 0.76, "learning_rate": 7.057446593250936e-07, "loss": 1.252, "step": 25300 }, { "epoch": 0.76, "learning_rate": 7.055748140837426e-07, "loss": 1.0511, "step": 25301 }, { "epoch": 0.76, "learning_rate": 7.05404985924455e-07, "loss": 1.0659, "step": 25302 }, { "epoch": 0.76, "learning_rate": 7.052351748488476e-07, "loss": 1.0865, "step": 25303 }, { "epoch": 0.76, "learning_rate": 7.050653808585376e-07, "loss": 1.2487, "step": 25304 }, { "epoch": 0.76, "learning_rate": 7.048956039551399e-07, "loss": 1.1722, "step": 25305 }, { "epoch": 0.76, "learning_rate": 7.047258441402719e-07, "loss": 1.0139, "step": 25306 }, { "epoch": 0.76, "learning_rate": 7.045561014155489e-07, "loss": 1.0762, "step": 25307 }, { "epoch": 0.76, "learning_rate": 7.04386375782588e-07, "loss": 1.0172, "step": 25308 }, { "epoch": 0.76, "learning_rate": 7.042166672430031e-07, "loss": 1.0548, "step": 25309 }, { "epoch": 0.76, "learning_rate": 7.040469757984108e-07, "loss": 1.1067, "step": 25310 }, { "epoch": 0.76, "learning_rate": 7.038773014504264e-07, "loss": 1.2003, "step": 25311 }, { "epoch": 0.76, "learning_rate": 7.037076442006654e-07, "loss": 1.0496, "step": 25312 }, { "epoch": 0.76, "learning_rate": 7.035380040507423e-07, "loss": 1.1248, "step": 25313 }, { "epoch": 0.76, "learning_rate": 7.033683810022718e-07, "loss": 1.0938, "step": 25314 }, { "epoch": 0.76, "learning_rate": 7.031987750568692e-07, "loss": 1.0455, "step": 25315 }, { "epoch": 0.76, "learning_rate": 7.030291862161487e-07, "loss": 1.1952, "step": 25316 }, { "epoch": 0.76, "learning_rate": 7.02859614481726e-07, "loss": 1.0306, "step": 25317 }, { "epoch": 0.76, "learning_rate": 7.026900598552131e-07, "loss": 1.0162, "step": 25318 }, { "epoch": 0.76, "learning_rate": 7.025205223382253e-07, "loss": 1.1693, "step": 25319 }, { "epoch": 0.76, "learning_rate": 7.023510019323768e-07, "loss": 1.0538, "step": 25320 }, { "epoch": 0.76, "learning_rate": 7.021814986392813e-07, "loss": 1.059, "step": 25321 }, { "epoch": 0.76, "learning_rate": 7.020120124605515e-07, "loss": 1.0756, "step": 25322 }, { "epoch": 0.76, "learning_rate": 7.018425433978012e-07, "loss": 1.0768, "step": 25323 }, { "epoch": 0.76, "learning_rate": 7.016730914526442e-07, "loss": 1.2098, "step": 25324 }, { "epoch": 0.76, "learning_rate": 7.015036566266931e-07, "loss": 1.1241, "step": 25325 }, { "epoch": 0.76, "learning_rate": 7.01334238921561e-07, "loss": 1.0244, "step": 25326 }, { "epoch": 0.76, "learning_rate": 7.011648383388608e-07, "loss": 1.0109, "step": 25327 }, { "epoch": 0.76, "learning_rate": 7.009954548802047e-07, "loss": 1.0574, "step": 25328 }, { "epoch": 0.76, "learning_rate": 7.008260885472057e-07, "loss": 1.0942, "step": 25329 }, { "epoch": 0.76, "learning_rate": 7.006567393414765e-07, "loss": 1.0716, "step": 25330 }, { "epoch": 0.76, "learning_rate": 7.004874072646279e-07, "loss": 0.9884, "step": 25331 }, { "epoch": 0.76, "learning_rate": 7.003180923182723e-07, "loss": 1.08, "step": 25332 }, { "epoch": 0.76, "learning_rate": 7.001487945040217e-07, "loss": 1.0694, "step": 25333 }, { "epoch": 0.76, "learning_rate": 6.999795138234888e-07, "loss": 1.0494, "step": 25334 }, { "epoch": 0.76, "learning_rate": 6.99810250278283e-07, "loss": 1.108, "step": 25335 }, { "epoch": 0.76, "learning_rate": 6.996410038700166e-07, "loss": 1.1279, "step": 25336 }, { "epoch": 0.76, "learning_rate": 6.994717746003008e-07, "loss": 1.1783, "step": 25337 }, { "epoch": 0.76, "learning_rate": 6.993025624707476e-07, "loss": 1.1241, "step": 25338 }, { "epoch": 0.76, "learning_rate": 6.991333674829656e-07, "loss": 1.1068, "step": 25339 }, { "epoch": 0.76, "learning_rate": 6.989641896385665e-07, "loss": 1.1053, "step": 25340 }, { "epoch": 0.76, "learning_rate": 6.987950289391613e-07, "loss": 0.9799, "step": 25341 }, { "epoch": 0.76, "learning_rate": 6.986258853863597e-07, "loss": 1.1527, "step": 25342 }, { "epoch": 0.76, "learning_rate": 6.984567589817731e-07, "loss": 1.1844, "step": 25343 }, { "epoch": 0.76, "learning_rate": 6.982876497270094e-07, "loss": 1.0764, "step": 25344 }, { "epoch": 0.76, "learning_rate": 6.981185576236799e-07, "loss": 1.0372, "step": 25345 }, { "epoch": 0.76, "learning_rate": 6.979494826733938e-07, "loss": 1.1749, "step": 25346 }, { "epoch": 0.76, "learning_rate": 6.977804248777614e-07, "loss": 1.1956, "step": 25347 }, { "epoch": 0.76, "learning_rate": 6.976113842383905e-07, "loss": 1.0067, "step": 25348 }, { "epoch": 0.76, "learning_rate": 6.974423607568914e-07, "loss": 1.1759, "step": 25349 }, { "epoch": 0.76, "learning_rate": 6.972733544348728e-07, "loss": 1.0138, "step": 25350 }, { "epoch": 0.76, "learning_rate": 6.971043652739437e-07, "loss": 1.0626, "step": 25351 }, { "epoch": 0.76, "learning_rate": 6.969353932757125e-07, "loss": 0.9705, "step": 25352 }, { "epoch": 0.76, "learning_rate": 6.967664384417883e-07, "loss": 1.0406, "step": 25353 }, { "epoch": 0.76, "learning_rate": 6.965975007737789e-07, "loss": 1.0536, "step": 25354 }, { "epoch": 0.76, "learning_rate": 6.964285802732929e-07, "loss": 1.1182, "step": 25355 }, { "epoch": 0.76, "learning_rate": 6.962596769419388e-07, "loss": 1.0286, "step": 25356 }, { "epoch": 0.76, "learning_rate": 6.96090790781323e-07, "loss": 0.9911, "step": 25357 }, { "epoch": 0.76, "learning_rate": 6.959219217930544e-07, "loss": 1.1417, "step": 25358 }, { "epoch": 0.76, "learning_rate": 6.957530699787402e-07, "loss": 1.0613, "step": 25359 }, { "epoch": 0.76, "learning_rate": 6.955842353399883e-07, "loss": 1.062, "step": 25360 }, { "epoch": 0.76, "learning_rate": 6.954154178784048e-07, "loss": 1.0639, "step": 25361 }, { "epoch": 0.76, "learning_rate": 6.952466175955974e-07, "loss": 1.0712, "step": 25362 }, { "epoch": 0.76, "learning_rate": 6.950778344931733e-07, "loss": 1.0773, "step": 25363 }, { "epoch": 0.76, "learning_rate": 6.949090685727394e-07, "loss": 1.0847, "step": 25364 }, { "epoch": 0.76, "learning_rate": 6.94740319835901e-07, "loss": 1.043, "step": 25365 }, { "epoch": 0.76, "learning_rate": 6.945715882842655e-07, "loss": 1.0969, "step": 25366 }, { "epoch": 0.76, "learning_rate": 6.944028739194389e-07, "loss": 1.1765, "step": 25367 }, { "epoch": 0.76, "learning_rate": 6.942341767430272e-07, "loss": 1.2083, "step": 25368 }, { "epoch": 0.76, "learning_rate": 6.940654967566374e-07, "loss": 1.1863, "step": 25369 }, { "epoch": 0.76, "learning_rate": 6.938968339618734e-07, "loss": 0.9915, "step": 25370 }, { "epoch": 0.76, "learning_rate": 6.937281883603417e-07, "loss": 1.0785, "step": 25371 }, { "epoch": 0.76, "learning_rate": 6.935595599536477e-07, "loss": 1.1009, "step": 25372 }, { "epoch": 0.76, "learning_rate": 6.933909487433976e-07, "loss": 1.1835, "step": 25373 }, { "epoch": 0.76, "learning_rate": 6.932223547311947e-07, "loss": 1.058, "step": 25374 }, { "epoch": 0.76, "learning_rate": 6.930537779186447e-07, "loss": 1.1581, "step": 25375 }, { "epoch": 0.76, "learning_rate": 6.928852183073526e-07, "loss": 1.0968, "step": 25376 }, { "epoch": 0.76, "learning_rate": 6.927166758989229e-07, "loss": 1.1971, "step": 25377 }, { "epoch": 0.76, "learning_rate": 6.925481506949599e-07, "loss": 1.0972, "step": 25378 }, { "epoch": 0.76, "learning_rate": 6.923796426970683e-07, "loss": 1.1575, "step": 25379 }, { "epoch": 0.76, "learning_rate": 6.922111519068517e-07, "loss": 1.0153, "step": 25380 }, { "epoch": 0.76, "learning_rate": 6.920426783259151e-07, "loss": 1.2128, "step": 25381 }, { "epoch": 0.76, "learning_rate": 6.918742219558608e-07, "loss": 1.1849, "step": 25382 }, { "epoch": 0.76, "learning_rate": 6.917057827982929e-07, "loss": 1.1224, "step": 25383 }, { "epoch": 0.76, "learning_rate": 6.915373608548151e-07, "loss": 1.037, "step": 25384 }, { "epoch": 0.76, "learning_rate": 6.913689561270306e-07, "loss": 1.191, "step": 25385 }, { "epoch": 0.76, "learning_rate": 6.912005686165432e-07, "loss": 1.103, "step": 25386 }, { "epoch": 0.76, "learning_rate": 6.910321983249549e-07, "loss": 1.1403, "step": 25387 }, { "epoch": 0.76, "learning_rate": 6.908638452538685e-07, "loss": 1.1832, "step": 25388 }, { "epoch": 0.76, "learning_rate": 6.90695509404887e-07, "loss": 1.0871, "step": 25389 }, { "epoch": 0.76, "learning_rate": 6.905271907796137e-07, "loss": 1.0145, "step": 25390 }, { "epoch": 0.76, "learning_rate": 6.903588893796492e-07, "loss": 0.8979, "step": 25391 }, { "epoch": 0.76, "learning_rate": 6.901906052065968e-07, "loss": 1.1001, "step": 25392 }, { "epoch": 0.76, "learning_rate": 6.90022338262058e-07, "loss": 1.0353, "step": 25393 }, { "epoch": 0.76, "learning_rate": 6.898540885476357e-07, "loss": 1.0796, "step": 25394 }, { "epoch": 0.77, "learning_rate": 6.896858560649297e-07, "loss": 1.0858, "step": 25395 }, { "epoch": 0.77, "learning_rate": 6.895176408155427e-07, "loss": 1.0178, "step": 25396 }, { "epoch": 0.77, "learning_rate": 6.893494428010758e-07, "loss": 1.0109, "step": 25397 }, { "epoch": 0.77, "learning_rate": 6.8918126202313e-07, "loss": 1.1562, "step": 25398 }, { "epoch": 0.77, "learning_rate": 6.890130984833074e-07, "loss": 1.1889, "step": 25399 }, { "epoch": 0.77, "learning_rate": 6.888449521832069e-07, "loss": 1.0661, "step": 25400 }, { "epoch": 0.77, "learning_rate": 6.886768231244304e-07, "loss": 1.0867, "step": 25401 }, { "epoch": 0.77, "learning_rate": 6.885087113085781e-07, "loss": 1.1023, "step": 25402 }, { "epoch": 0.77, "learning_rate": 6.883406167372503e-07, "loss": 1.046, "step": 25403 }, { "epoch": 0.77, "learning_rate": 6.881725394120483e-07, "loss": 1.1617, "step": 25404 }, { "epoch": 0.77, "learning_rate": 6.880044793345702e-07, "loss": 1.217, "step": 25405 }, { "epoch": 0.77, "learning_rate": 6.878364365064169e-07, "loss": 1.1476, "step": 25406 }, { "epoch": 0.77, "learning_rate": 6.876684109291878e-07, "loss": 1.1569, "step": 25407 }, { "epoch": 0.77, "learning_rate": 6.875004026044827e-07, "loss": 1.1031, "step": 25408 }, { "epoch": 0.77, "learning_rate": 6.873324115339005e-07, "loss": 1.1227, "step": 25409 }, { "epoch": 0.77, "learning_rate": 6.871644377190412e-07, "loss": 1.1752, "step": 25410 }, { "epoch": 0.77, "learning_rate": 6.869964811615032e-07, "loss": 1.184, "step": 25411 }, { "epoch": 0.77, "learning_rate": 6.868285418628861e-07, "loss": 1.1004, "step": 25412 }, { "epoch": 0.77, "learning_rate": 6.866606198247877e-07, "loss": 1.0986, "step": 25413 }, { "epoch": 0.77, "learning_rate": 6.864927150488065e-07, "loss": 1.1584, "step": 25414 }, { "epoch": 0.77, "learning_rate": 6.863248275365414e-07, "loss": 1.0889, "step": 25415 }, { "epoch": 0.77, "learning_rate": 6.86156957289591e-07, "loss": 1.1178, "step": 25416 }, { "epoch": 0.77, "learning_rate": 6.859891043095524e-07, "loss": 1.1187, "step": 25417 }, { "epoch": 0.77, "learning_rate": 6.858212685980234e-07, "loss": 1.0737, "step": 25418 }, { "epoch": 0.77, "learning_rate": 6.856534501566026e-07, "loss": 1.1905, "step": 25419 }, { "epoch": 0.77, "learning_rate": 6.854856489868877e-07, "loss": 1.1471, "step": 25420 }, { "epoch": 0.77, "learning_rate": 6.853178650904746e-07, "loss": 1.0676, "step": 25421 }, { "epoch": 0.77, "learning_rate": 6.851500984689619e-07, "loss": 1.1607, "step": 25422 }, { "epoch": 0.77, "learning_rate": 6.849823491239457e-07, "loss": 1.0117, "step": 25423 }, { "epoch": 0.77, "learning_rate": 6.848146170570236e-07, "loss": 1.1354, "step": 25424 }, { "epoch": 0.77, "learning_rate": 6.84646902269793e-07, "loss": 1.2274, "step": 25425 }, { "epoch": 0.77, "learning_rate": 6.844792047638487e-07, "loss": 1.2302, "step": 25426 }, { "epoch": 0.77, "learning_rate": 6.84311524540788e-07, "loss": 1.1113, "step": 25427 }, { "epoch": 0.77, "learning_rate": 6.841438616022073e-07, "loss": 1.1368, "step": 25428 }, { "epoch": 0.77, "learning_rate": 6.839762159497029e-07, "loss": 1.1021, "step": 25429 }, { "epoch": 0.77, "learning_rate": 6.838085875848699e-07, "loss": 1.0821, "step": 25430 }, { "epoch": 0.77, "learning_rate": 6.836409765093041e-07, "loss": 1.1259, "step": 25431 }, { "epoch": 0.77, "learning_rate": 6.834733827246018e-07, "loss": 1.0944, "step": 25432 }, { "epoch": 0.77, "learning_rate": 6.833058062323577e-07, "loss": 1.0669, "step": 25433 }, { "epoch": 0.77, "learning_rate": 6.831382470341674e-07, "loss": 1.0943, "step": 25434 }, { "epoch": 0.77, "learning_rate": 6.829707051316262e-07, "loss": 1.1132, "step": 25435 }, { "epoch": 0.77, "learning_rate": 6.828031805263285e-07, "loss": 1.2478, "step": 25436 }, { "epoch": 0.77, "learning_rate": 6.826356732198694e-07, "loss": 1.1526, "step": 25437 }, { "epoch": 0.77, "learning_rate": 6.824681832138444e-07, "loss": 1.0745, "step": 25438 }, { "epoch": 0.77, "learning_rate": 6.823007105098459e-07, "loss": 1.1424, "step": 25439 }, { "epoch": 0.77, "learning_rate": 6.821332551094692e-07, "loss": 1.1475, "step": 25440 }, { "epoch": 0.77, "learning_rate": 6.819658170143087e-07, "loss": 1.0547, "step": 25441 }, { "epoch": 0.77, "learning_rate": 6.817983962259583e-07, "loss": 1.0908, "step": 25442 }, { "epoch": 0.77, "learning_rate": 6.816309927460113e-07, "loss": 1.1967, "step": 25443 }, { "epoch": 0.77, "learning_rate": 6.81463606576061e-07, "loss": 1.0764, "step": 25444 }, { "epoch": 0.77, "learning_rate": 6.812962377177016e-07, "loss": 1.0667, "step": 25445 }, { "epoch": 0.77, "learning_rate": 6.811288861725268e-07, "loss": 1.1293, "step": 25446 }, { "epoch": 0.77, "learning_rate": 6.809615519421284e-07, "loss": 1.0796, "step": 25447 }, { "epoch": 0.77, "learning_rate": 6.807942350280996e-07, "loss": 1.0679, "step": 25448 }, { "epoch": 0.77, "learning_rate": 6.806269354320339e-07, "loss": 1.0247, "step": 25449 }, { "epoch": 0.77, "learning_rate": 6.804596531555232e-07, "loss": 1.1585, "step": 25450 }, { "epoch": 0.77, "learning_rate": 6.802923882001614e-07, "loss": 1.1348, "step": 25451 }, { "epoch": 0.77, "learning_rate": 6.801251405675385e-07, "loss": 1.0356, "step": 25452 }, { "epoch": 0.77, "learning_rate": 6.799579102592479e-07, "loss": 1.1783, "step": 25453 }, { "epoch": 0.77, "learning_rate": 6.797906972768817e-07, "loss": 1.0657, "step": 25454 }, { "epoch": 0.77, "learning_rate": 6.796235016220318e-07, "loss": 1.204, "step": 25455 }, { "epoch": 0.77, "learning_rate": 6.794563232962889e-07, "loss": 0.999, "step": 25456 }, { "epoch": 0.77, "learning_rate": 6.792891623012451e-07, "loss": 1.0881, "step": 25457 }, { "epoch": 0.77, "learning_rate": 6.791220186384914e-07, "loss": 1.0162, "step": 25458 }, { "epoch": 0.77, "learning_rate": 6.789548923096193e-07, "loss": 1.0013, "step": 25459 }, { "epoch": 0.77, "learning_rate": 6.787877833162193e-07, "loss": 1.129, "step": 25460 }, { "epoch": 0.77, "learning_rate": 6.786206916598825e-07, "loss": 1.1045, "step": 25461 }, { "epoch": 0.77, "learning_rate": 6.784536173421999e-07, "loss": 1.1448, "step": 25462 }, { "epoch": 0.77, "learning_rate": 6.782865603647612e-07, "loss": 1.0367, "step": 25463 }, { "epoch": 0.77, "learning_rate": 6.78119520729158e-07, "loss": 1.078, "step": 25464 }, { "epoch": 0.77, "learning_rate": 6.779524984369786e-07, "loss": 1.0761, "step": 25465 }, { "epoch": 0.77, "learning_rate": 6.777854934898139e-07, "loss": 1.1669, "step": 25466 }, { "epoch": 0.77, "learning_rate": 6.77618505889254e-07, "loss": 1.0475, "step": 25467 }, { "epoch": 0.77, "learning_rate": 6.774515356368888e-07, "loss": 0.9987, "step": 25468 }, { "epoch": 0.77, "learning_rate": 6.772845827343063e-07, "loss": 1.1464, "step": 25469 }, { "epoch": 0.77, "learning_rate": 6.77117647183097e-07, "loss": 1.0466, "step": 25470 }, { "epoch": 0.77, "learning_rate": 6.769507289848496e-07, "loss": 1.1949, "step": 25471 }, { "epoch": 0.77, "learning_rate": 6.76783828141154e-07, "loss": 1.1215, "step": 25472 }, { "epoch": 0.77, "learning_rate": 6.766169446535975e-07, "loss": 1.1289, "step": 25473 }, { "epoch": 0.77, "learning_rate": 6.764500785237696e-07, "loss": 1.2128, "step": 25474 }, { "epoch": 0.77, "learning_rate": 6.762832297532587e-07, "loss": 1.0923, "step": 25475 }, { "epoch": 0.77, "learning_rate": 6.761163983436531e-07, "loss": 1.1119, "step": 25476 }, { "epoch": 0.77, "learning_rate": 6.759495842965416e-07, "loss": 1.1815, "step": 25477 }, { "epoch": 0.77, "learning_rate": 6.757827876135109e-07, "loss": 1.1462, "step": 25478 }, { "epoch": 0.77, "learning_rate": 6.756160082961497e-07, "loss": 1.0472, "step": 25479 }, { "epoch": 0.77, "learning_rate": 6.754492463460452e-07, "loss": 1.1124, "step": 25480 }, { "epoch": 0.77, "learning_rate": 6.75282501764786e-07, "loss": 0.9057, "step": 25481 }, { "epoch": 0.77, "learning_rate": 6.751157745539577e-07, "loss": 1.1444, "step": 25482 }, { "epoch": 0.77, "learning_rate": 6.749490647151482e-07, "loss": 1.1262, "step": 25483 }, { "epoch": 0.77, "learning_rate": 6.74782372249945e-07, "loss": 1.0135, "step": 25484 }, { "epoch": 0.77, "learning_rate": 6.746156971599344e-07, "loss": 1.0589, "step": 25485 }, { "epoch": 0.77, "learning_rate": 6.744490394467041e-07, "loss": 1.1326, "step": 25486 }, { "epoch": 0.77, "learning_rate": 6.742823991118386e-07, "loss": 1.1365, "step": 25487 }, { "epoch": 0.77, "learning_rate": 6.741157761569255e-07, "loss": 1.1312, "step": 25488 }, { "epoch": 0.77, "learning_rate": 6.73949170583551e-07, "loss": 1.0723, "step": 25489 }, { "epoch": 0.77, "learning_rate": 6.737825823933008e-07, "loss": 0.9454, "step": 25490 }, { "epoch": 0.77, "learning_rate": 6.73616011587761e-07, "loss": 1.0068, "step": 25491 }, { "epoch": 0.77, "learning_rate": 6.734494581685172e-07, "loss": 1.1343, "step": 25492 }, { "epoch": 0.77, "learning_rate": 6.732829221371548e-07, "loss": 1.1382, "step": 25493 }, { "epoch": 0.77, "learning_rate": 6.7311640349526e-07, "loss": 1.0158, "step": 25494 }, { "epoch": 0.77, "learning_rate": 6.729499022444163e-07, "loss": 1.1255, "step": 25495 }, { "epoch": 0.77, "learning_rate": 6.727834183862098e-07, "loss": 1.1943, "step": 25496 }, { "epoch": 0.77, "learning_rate": 6.726169519222248e-07, "loss": 1.0735, "step": 25497 }, { "epoch": 0.77, "learning_rate": 6.724505028540474e-07, "loss": 0.9561, "step": 25498 }, { "epoch": 0.77, "learning_rate": 6.722840711832602e-07, "loss": 1.1005, "step": 25499 }, { "epoch": 0.77, "learning_rate": 6.721176569114482e-07, "loss": 1.0173, "step": 25500 }, { "epoch": 0.77, "learning_rate": 6.719512600401959e-07, "loss": 1.0744, "step": 25501 }, { "epoch": 0.77, "learning_rate": 6.717848805710872e-07, "loss": 1.0439, "step": 25502 }, { "epoch": 0.77, "learning_rate": 6.716185185057067e-07, "loss": 1.1101, "step": 25503 }, { "epoch": 0.77, "learning_rate": 6.714521738456364e-07, "loss": 1.1641, "step": 25504 }, { "epoch": 0.77, "learning_rate": 6.712858465924609e-07, "loss": 1.0616, "step": 25505 }, { "epoch": 0.77, "learning_rate": 6.711195367477635e-07, "loss": 0.9598, "step": 25506 }, { "epoch": 0.77, "learning_rate": 6.709532443131281e-07, "loss": 1.1187, "step": 25507 }, { "epoch": 0.77, "learning_rate": 6.707869692901358e-07, "loss": 1.1121, "step": 25508 }, { "epoch": 0.77, "learning_rate": 6.706207116803709e-07, "loss": 1.0948, "step": 25509 }, { "epoch": 0.77, "learning_rate": 6.704544714854155e-07, "loss": 0.9792, "step": 25510 }, { "epoch": 0.77, "learning_rate": 6.702882487068535e-07, "loss": 0.9614, "step": 25511 }, { "epoch": 0.77, "learning_rate": 6.701220433462651e-07, "loss": 1.1381, "step": 25512 }, { "epoch": 0.77, "learning_rate": 6.699558554052335e-07, "loss": 1.1395, "step": 25513 }, { "epoch": 0.77, "learning_rate": 6.697896848853411e-07, "loss": 1.0392, "step": 25514 }, { "epoch": 0.77, "learning_rate": 6.696235317881692e-07, "loss": 1.0912, "step": 25515 }, { "epoch": 0.77, "learning_rate": 6.694573961152998e-07, "loss": 1.0407, "step": 25516 }, { "epoch": 0.77, "learning_rate": 6.692912778683144e-07, "loss": 1.1863, "step": 25517 }, { "epoch": 0.77, "learning_rate": 6.691251770487941e-07, "loss": 1.1934, "step": 25518 }, { "epoch": 0.77, "learning_rate": 6.689590936583207e-07, "loss": 1.0542, "step": 25519 }, { "epoch": 0.77, "learning_rate": 6.687930276984755e-07, "loss": 1.1521, "step": 25520 }, { "epoch": 0.77, "learning_rate": 6.686269791708377e-07, "loss": 1.0695, "step": 25521 }, { "epoch": 0.77, "learning_rate": 6.684609480769894e-07, "loss": 1.1529, "step": 25522 }, { "epoch": 0.77, "learning_rate": 6.682949344185108e-07, "loss": 1.1418, "step": 25523 }, { "epoch": 0.77, "learning_rate": 6.681289381969828e-07, "loss": 1.2383, "step": 25524 }, { "epoch": 0.77, "learning_rate": 6.679629594139842e-07, "loss": 1.1454, "step": 25525 }, { "epoch": 0.77, "learning_rate": 6.67796998071096e-07, "loss": 1.1147, "step": 25526 }, { "epoch": 0.77, "learning_rate": 6.676310541698979e-07, "loss": 1.1443, "step": 25527 }, { "epoch": 0.77, "learning_rate": 6.6746512771197e-07, "loss": 1.2234, "step": 25528 }, { "epoch": 0.77, "learning_rate": 6.672992186988919e-07, "loss": 1.0308, "step": 25529 }, { "epoch": 0.77, "learning_rate": 6.67133327132242e-07, "loss": 1.1492, "step": 25530 }, { "epoch": 0.77, "learning_rate": 6.669674530136e-07, "loss": 1.0048, "step": 25531 }, { "epoch": 0.77, "learning_rate": 6.668015963445451e-07, "loss": 1.0685, "step": 25532 }, { "epoch": 0.77, "learning_rate": 6.666357571266568e-07, "loss": 1.0853, "step": 25533 }, { "epoch": 0.77, "learning_rate": 6.664699353615123e-07, "loss": 1.1216, "step": 25534 }, { "epoch": 0.77, "learning_rate": 6.663041310506909e-07, "loss": 1.1525, "step": 25535 }, { "epoch": 0.77, "learning_rate": 6.661383441957714e-07, "loss": 1.2213, "step": 25536 }, { "epoch": 0.77, "learning_rate": 6.65972574798332e-07, "loss": 1.2118, "step": 25537 }, { "epoch": 0.77, "learning_rate": 6.658068228599499e-07, "loss": 1.0068, "step": 25538 }, { "epoch": 0.77, "learning_rate": 6.656410883822034e-07, "loss": 1.1109, "step": 25539 }, { "epoch": 0.77, "learning_rate": 6.654753713666703e-07, "loss": 1.0609, "step": 25540 }, { "epoch": 0.77, "learning_rate": 6.653096718149279e-07, "loss": 1.1569, "step": 25541 }, { "epoch": 0.77, "learning_rate": 6.651439897285541e-07, "loss": 1.1116, "step": 25542 }, { "epoch": 0.77, "learning_rate": 6.649783251091257e-07, "loss": 1.1755, "step": 25543 }, { "epoch": 0.77, "learning_rate": 6.648126779582198e-07, "loss": 1.1031, "step": 25544 }, { "epoch": 0.77, "learning_rate": 6.646470482774134e-07, "loss": 1.0847, "step": 25545 }, { "epoch": 0.77, "learning_rate": 6.644814360682841e-07, "loss": 1.1179, "step": 25546 }, { "epoch": 0.77, "learning_rate": 6.643158413324067e-07, "loss": 1.1202, "step": 25547 }, { "epoch": 0.77, "learning_rate": 6.641502640713582e-07, "loss": 1.1299, "step": 25548 }, { "epoch": 0.77, "learning_rate": 6.63984704286715e-07, "loss": 1.0867, "step": 25549 }, { "epoch": 0.77, "learning_rate": 6.638191619800541e-07, "loss": 1.0836, "step": 25550 }, { "epoch": 0.77, "learning_rate": 6.636536371529495e-07, "loss": 1.1939, "step": 25551 }, { "epoch": 0.77, "learning_rate": 6.634881298069781e-07, "loss": 1.0674, "step": 25552 }, { "epoch": 0.77, "learning_rate": 6.633226399437151e-07, "loss": 1.0513, "step": 25553 }, { "epoch": 0.77, "learning_rate": 6.631571675647358e-07, "loss": 1.0539, "step": 25554 }, { "epoch": 0.77, "learning_rate": 6.629917126716165e-07, "loss": 1.2223, "step": 25555 }, { "epoch": 0.77, "learning_rate": 6.628262752659306e-07, "loss": 1.2294, "step": 25556 }, { "epoch": 0.77, "learning_rate": 6.626608553492539e-07, "loss": 1.101, "step": 25557 }, { "epoch": 0.77, "learning_rate": 6.624954529231609e-07, "loss": 1.0984, "step": 25558 }, { "epoch": 0.77, "learning_rate": 6.623300679892269e-07, "loss": 1.1563, "step": 25559 }, { "epoch": 0.77, "learning_rate": 6.621647005490248e-07, "loss": 1.0409, "step": 25560 }, { "epoch": 0.77, "learning_rate": 6.619993506041298e-07, "loss": 1.2964, "step": 25561 }, { "epoch": 0.77, "learning_rate": 6.618340181561156e-07, "loss": 1.124, "step": 25562 }, { "epoch": 0.77, "learning_rate": 6.616687032065572e-07, "loss": 1.1249, "step": 25563 }, { "epoch": 0.77, "learning_rate": 6.615034057570263e-07, "loss": 1.1613, "step": 25564 }, { "epoch": 0.77, "learning_rate": 6.613381258090979e-07, "loss": 1.011, "step": 25565 }, { "epoch": 0.77, "learning_rate": 6.611728633643447e-07, "loss": 1.2272, "step": 25566 }, { "epoch": 0.77, "learning_rate": 6.610076184243402e-07, "loss": 1.0762, "step": 25567 }, { "epoch": 0.77, "learning_rate": 6.608423909906586e-07, "loss": 1.1149, "step": 25568 }, { "epoch": 0.77, "learning_rate": 6.606771810648708e-07, "loss": 1.1615, "step": 25569 }, { "epoch": 0.77, "learning_rate": 6.605119886485501e-07, "loss": 1.093, "step": 25570 }, { "epoch": 0.77, "learning_rate": 6.603468137432694e-07, "loss": 1.0849, "step": 25571 }, { "epoch": 0.77, "learning_rate": 6.601816563506013e-07, "loss": 1.0123, "step": 25572 }, { "epoch": 0.77, "learning_rate": 6.600165164721175e-07, "loss": 1.1345, "step": 25573 }, { "epoch": 0.77, "learning_rate": 6.598513941093906e-07, "loss": 1.1265, "step": 25574 }, { "epoch": 0.77, "learning_rate": 6.596862892639918e-07, "loss": 1.0416, "step": 25575 }, { "epoch": 0.77, "learning_rate": 6.595212019374944e-07, "loss": 1.1135, "step": 25576 }, { "epoch": 0.77, "learning_rate": 6.593561321314676e-07, "loss": 1.1276, "step": 25577 }, { "epoch": 0.77, "learning_rate": 6.59191079847484e-07, "loss": 1.124, "step": 25578 }, { "epoch": 0.77, "learning_rate": 6.59026045087115e-07, "loss": 0.8851, "step": 25579 }, { "epoch": 0.77, "learning_rate": 6.58861027851932e-07, "loss": 1.1356, "step": 25580 }, { "epoch": 0.77, "learning_rate": 6.586960281435046e-07, "loss": 1.2795, "step": 25581 }, { "epoch": 0.77, "learning_rate": 6.585310459634039e-07, "loss": 1.0338, "step": 25582 }, { "epoch": 0.77, "learning_rate": 6.583660813132011e-07, "loss": 1.0766, "step": 25583 }, { "epoch": 0.77, "learning_rate": 6.58201134194466e-07, "loss": 1.0544, "step": 25584 }, { "epoch": 0.77, "learning_rate": 6.580362046087701e-07, "loss": 1.0671, "step": 25585 }, { "epoch": 0.77, "learning_rate": 6.578712925576817e-07, "loss": 1.0654, "step": 25586 }, { "epoch": 0.77, "learning_rate": 6.577063980427711e-07, "loss": 1.0636, "step": 25587 }, { "epoch": 0.77, "learning_rate": 6.575415210656083e-07, "loss": 1.004, "step": 25588 }, { "epoch": 0.77, "learning_rate": 6.573766616277638e-07, "loss": 0.9724, "step": 25589 }, { "epoch": 0.77, "learning_rate": 6.572118197308052e-07, "loss": 1.0444, "step": 25590 }, { "epoch": 0.77, "learning_rate": 6.570469953763029e-07, "loss": 1.1517, "step": 25591 }, { "epoch": 0.77, "learning_rate": 6.568821885658253e-07, "loss": 1.1588, "step": 25592 }, { "epoch": 0.77, "learning_rate": 6.567173993009421e-07, "loss": 1.1407, "step": 25593 }, { "epoch": 0.77, "learning_rate": 6.565526275832209e-07, "loss": 1.1832, "step": 25594 }, { "epoch": 0.77, "learning_rate": 6.563878734142312e-07, "loss": 1.0947, "step": 25595 }, { "epoch": 0.77, "learning_rate": 6.562231367955407e-07, "loss": 1.2042, "step": 25596 }, { "epoch": 0.77, "learning_rate": 6.56058417728718e-07, "loss": 1.0484, "step": 25597 }, { "epoch": 0.77, "learning_rate": 6.558937162153311e-07, "loss": 1.2158, "step": 25598 }, { "epoch": 0.77, "learning_rate": 6.557290322569479e-07, "loss": 1.1454, "step": 25599 }, { "epoch": 0.77, "learning_rate": 6.555643658551361e-07, "loss": 1.1119, "step": 25600 }, { "epoch": 0.77, "learning_rate": 6.553997170114631e-07, "loss": 1.0952, "step": 25601 }, { "epoch": 0.77, "learning_rate": 6.552350857274972e-07, "loss": 1.1426, "step": 25602 }, { "epoch": 0.77, "learning_rate": 6.550704720048043e-07, "loss": 1.1721, "step": 25603 }, { "epoch": 0.77, "learning_rate": 6.549058758449517e-07, "loss": 1.2529, "step": 25604 }, { "epoch": 0.77, "learning_rate": 6.547412972495065e-07, "loss": 1.1802, "step": 25605 }, { "epoch": 0.77, "learning_rate": 6.545767362200364e-07, "loss": 1.1025, "step": 25606 }, { "epoch": 0.77, "learning_rate": 6.544121927581059e-07, "loss": 1.1519, "step": 25607 }, { "epoch": 0.77, "learning_rate": 6.542476668652828e-07, "loss": 1.1231, "step": 25608 }, { "epoch": 0.77, "learning_rate": 6.540831585431329e-07, "loss": 1.1038, "step": 25609 }, { "epoch": 0.77, "learning_rate": 6.539186677932222e-07, "loss": 1.0325, "step": 25610 }, { "epoch": 0.77, "learning_rate": 6.537541946171175e-07, "loss": 1.1178, "step": 25611 }, { "epoch": 0.77, "learning_rate": 6.535897390163828e-07, "loss": 1.2004, "step": 25612 }, { "epoch": 0.77, "learning_rate": 6.534253009925848e-07, "loss": 1.1888, "step": 25613 }, { "epoch": 0.77, "learning_rate": 6.532608805472885e-07, "loss": 1.0723, "step": 25614 }, { "epoch": 0.77, "learning_rate": 6.530964776820597e-07, "loss": 1.0851, "step": 25615 }, { "epoch": 0.77, "learning_rate": 6.529320923984625e-07, "loss": 1.0915, "step": 25616 }, { "epoch": 0.77, "learning_rate": 6.527677246980621e-07, "loss": 1.0522, "step": 25617 }, { "epoch": 0.77, "learning_rate": 6.526033745824231e-07, "loss": 1.1686, "step": 25618 }, { "epoch": 0.77, "learning_rate": 6.524390420531112e-07, "loss": 1.1359, "step": 25619 }, { "epoch": 0.77, "learning_rate": 6.522747271116891e-07, "loss": 1.101, "step": 25620 }, { "epoch": 0.77, "learning_rate": 6.521104297597216e-07, "loss": 1.1119, "step": 25621 }, { "epoch": 0.77, "learning_rate": 6.519461499987728e-07, "loss": 1.1544, "step": 25622 }, { "epoch": 0.77, "learning_rate": 6.517818878304066e-07, "loss": 1.0468, "step": 25623 }, { "epoch": 0.77, "learning_rate": 6.516176432561869e-07, "loss": 1.1111, "step": 25624 }, { "epoch": 0.77, "learning_rate": 6.51453416277677e-07, "loss": 1.199, "step": 25625 }, { "epoch": 0.77, "learning_rate": 6.512892068964399e-07, "loss": 1.0513, "step": 25626 }, { "epoch": 0.77, "learning_rate": 6.511250151140396e-07, "loss": 1.1151, "step": 25627 }, { "epoch": 0.77, "learning_rate": 6.509608409320392e-07, "loss": 1.0611, "step": 25628 }, { "epoch": 0.77, "learning_rate": 6.507966843520005e-07, "loss": 1.0931, "step": 25629 }, { "epoch": 0.77, "learning_rate": 6.506325453754866e-07, "loss": 1.1722, "step": 25630 }, { "epoch": 0.77, "learning_rate": 6.504684240040604e-07, "loss": 1.1625, "step": 25631 }, { "epoch": 0.77, "learning_rate": 6.503043202392844e-07, "loss": 1.0297, "step": 25632 }, { "epoch": 0.77, "learning_rate": 6.5014023408272e-07, "loss": 1.0748, "step": 25633 }, { "epoch": 0.77, "learning_rate": 6.499761655359297e-07, "loss": 1.0684, "step": 25634 }, { "epoch": 0.77, "learning_rate": 6.498121146004751e-07, "loss": 1.1367, "step": 25635 }, { "epoch": 0.77, "learning_rate": 6.496480812779182e-07, "loss": 1.1837, "step": 25636 }, { "epoch": 0.77, "learning_rate": 6.494840655698212e-07, "loss": 1.1636, "step": 25637 }, { "epoch": 0.77, "learning_rate": 6.493200674777437e-07, "loss": 1.1538, "step": 25638 }, { "epoch": 0.77, "learning_rate": 6.491560870032479e-07, "loss": 1.0843, "step": 25639 }, { "epoch": 0.77, "learning_rate": 6.48992124147895e-07, "loss": 1.0385, "step": 25640 }, { "epoch": 0.77, "learning_rate": 6.488281789132461e-07, "loss": 1.1432, "step": 25641 }, { "epoch": 0.77, "learning_rate": 6.486642513008607e-07, "loss": 1.1315, "step": 25642 }, { "epoch": 0.77, "learning_rate": 6.485003413123001e-07, "loss": 1.1052, "step": 25643 }, { "epoch": 0.77, "learning_rate": 6.483364489491242e-07, "loss": 1.0507, "step": 25644 }, { "epoch": 0.77, "learning_rate": 6.481725742128947e-07, "loss": 1.0889, "step": 25645 }, { "epoch": 0.77, "learning_rate": 6.480087171051694e-07, "loss": 1.1166, "step": 25646 }, { "epoch": 0.77, "learning_rate": 6.478448776275092e-07, "loss": 1.1154, "step": 25647 }, { "epoch": 0.77, "learning_rate": 6.476810557814736e-07, "loss": 1.1598, "step": 25648 }, { "epoch": 0.77, "learning_rate": 6.475172515686226e-07, "loss": 1.0765, "step": 25649 }, { "epoch": 0.77, "learning_rate": 6.47353464990515e-07, "loss": 1.1215, "step": 25650 }, { "epoch": 0.77, "learning_rate": 6.471896960487109e-07, "loss": 1.0873, "step": 25651 }, { "epoch": 0.77, "learning_rate": 6.470259447447677e-07, "loss": 1.0635, "step": 25652 }, { "epoch": 0.77, "learning_rate": 6.468622110802453e-07, "loss": 1.0634, "step": 25653 }, { "epoch": 0.77, "learning_rate": 6.466984950567018e-07, "loss": 1.1729, "step": 25654 }, { "epoch": 0.77, "learning_rate": 6.465347966756963e-07, "loss": 1.1404, "step": 25655 }, { "epoch": 0.77, "learning_rate": 6.46371115938787e-07, "loss": 1.152, "step": 25656 }, { "epoch": 0.77, "learning_rate": 6.462074528475318e-07, "loss": 1.0739, "step": 25657 }, { "epoch": 0.77, "learning_rate": 6.460438074034895e-07, "loss": 1.0476, "step": 25658 }, { "epoch": 0.77, "learning_rate": 6.458801796082165e-07, "loss": 1.0533, "step": 25659 }, { "epoch": 0.77, "learning_rate": 6.457165694632714e-07, "loss": 1.0353, "step": 25660 }, { "epoch": 0.77, "learning_rate": 6.455529769702112e-07, "loss": 1.2949, "step": 25661 }, { "epoch": 0.77, "learning_rate": 6.453894021305937e-07, "loss": 1.0638, "step": 25662 }, { "epoch": 0.77, "learning_rate": 6.452258449459767e-07, "loss": 1.0716, "step": 25663 }, { "epoch": 0.77, "learning_rate": 6.450623054179156e-07, "loss": 1.0917, "step": 25664 }, { "epoch": 0.77, "learning_rate": 6.44898783547968e-07, "loss": 1.0451, "step": 25665 }, { "epoch": 0.77, "learning_rate": 6.447352793376905e-07, "loss": 1.0757, "step": 25666 }, { "epoch": 0.77, "learning_rate": 6.445717927886402e-07, "loss": 1.1619, "step": 25667 }, { "epoch": 0.77, "learning_rate": 6.444083239023724e-07, "loss": 1.1961, "step": 25668 }, { "epoch": 0.77, "learning_rate": 6.442448726804434e-07, "loss": 1.1157, "step": 25669 }, { "epoch": 0.77, "learning_rate": 6.440814391244097e-07, "loss": 1.0001, "step": 25670 }, { "epoch": 0.77, "learning_rate": 6.439180232358272e-07, "loss": 1.0298, "step": 25671 }, { "epoch": 0.77, "learning_rate": 6.437546250162508e-07, "loss": 1.0765, "step": 25672 }, { "epoch": 0.77, "learning_rate": 6.435912444672363e-07, "loss": 1.0137, "step": 25673 }, { "epoch": 0.77, "learning_rate": 6.434278815903392e-07, "loss": 1.1285, "step": 25674 }, { "epoch": 0.77, "learning_rate": 6.432645363871143e-07, "loss": 1.1197, "step": 25675 }, { "epoch": 0.77, "learning_rate": 6.431012088591173e-07, "loss": 1.0876, "step": 25676 }, { "epoch": 0.77, "learning_rate": 6.429378990079021e-07, "loss": 1.0276, "step": 25677 }, { "epoch": 0.77, "learning_rate": 6.427746068350238e-07, "loss": 1.0644, "step": 25678 }, { "epoch": 0.77, "learning_rate": 6.426113323420366e-07, "loss": 1.0793, "step": 25679 }, { "epoch": 0.77, "learning_rate": 6.424480755304949e-07, "loss": 1.0209, "step": 25680 }, { "epoch": 0.77, "learning_rate": 6.422848364019529e-07, "loss": 1.0374, "step": 25681 }, { "epoch": 0.77, "learning_rate": 6.421216149579645e-07, "loss": 1.0328, "step": 25682 }, { "epoch": 0.77, "learning_rate": 6.419584112000838e-07, "loss": 1.0605, "step": 25683 }, { "epoch": 0.77, "learning_rate": 6.417952251298648e-07, "loss": 1.0743, "step": 25684 }, { "epoch": 0.77, "learning_rate": 6.416320567488596e-07, "loss": 1.1523, "step": 25685 }, { "epoch": 0.77, "learning_rate": 6.414689060586221e-07, "loss": 1.0688, "step": 25686 }, { "epoch": 0.77, "learning_rate": 6.413057730607056e-07, "loss": 1.171, "step": 25687 }, { "epoch": 0.77, "learning_rate": 6.411426577566629e-07, "loss": 1.0568, "step": 25688 }, { "epoch": 0.77, "learning_rate": 6.409795601480475e-07, "loss": 1.0768, "step": 25689 }, { "epoch": 0.77, "learning_rate": 6.408164802364105e-07, "loss": 1.1361, "step": 25690 }, { "epoch": 0.77, "learning_rate": 6.406534180233057e-07, "loss": 1.0474, "step": 25691 }, { "epoch": 0.77, "learning_rate": 6.404903735102844e-07, "loss": 1.2344, "step": 25692 }, { "epoch": 0.77, "learning_rate": 6.403273466989001e-07, "loss": 1.0212, "step": 25693 }, { "epoch": 0.77, "learning_rate": 6.401643375907029e-07, "loss": 1.0047, "step": 25694 }, { "epoch": 0.77, "learning_rate": 6.400013461872457e-07, "loss": 1.0799, "step": 25695 }, { "epoch": 0.77, "learning_rate": 6.398383724900798e-07, "loss": 1.1565, "step": 25696 }, { "epoch": 0.77, "learning_rate": 6.396754165007577e-07, "loss": 1.1376, "step": 25697 }, { "epoch": 0.77, "learning_rate": 6.395124782208284e-07, "loss": 1.1234, "step": 25698 }, { "epoch": 0.77, "learning_rate": 6.393495576518446e-07, "loss": 1.0785, "step": 25699 }, { "epoch": 0.77, "learning_rate": 6.391866547953568e-07, "loss": 1.1001, "step": 25700 }, { "epoch": 0.77, "learning_rate": 6.390237696529162e-07, "loss": 1.1578, "step": 25701 }, { "epoch": 0.77, "learning_rate": 6.388609022260733e-07, "loss": 1.0087, "step": 25702 }, { "epoch": 0.77, "learning_rate": 6.386980525163777e-07, "loss": 1.1346, "step": 25703 }, { "epoch": 0.77, "learning_rate": 6.3853522052538e-07, "loss": 1.0936, "step": 25704 }, { "epoch": 0.77, "learning_rate": 6.38372406254631e-07, "loss": 1.1265, "step": 25705 }, { "epoch": 0.77, "learning_rate": 6.382096097056795e-07, "loss": 1.159, "step": 25706 }, { "epoch": 0.77, "learning_rate": 6.380468308800764e-07, "loss": 1.0955, "step": 25707 }, { "epoch": 0.77, "learning_rate": 6.378840697793703e-07, "loss": 1.0934, "step": 25708 }, { "epoch": 0.77, "learning_rate": 6.37721326405111e-07, "loss": 1.0905, "step": 25709 }, { "epoch": 0.77, "learning_rate": 6.375586007588489e-07, "loss": 1.1417, "step": 25710 }, { "epoch": 0.77, "learning_rate": 6.373958928421309e-07, "loss": 1.1105, "step": 25711 }, { "epoch": 0.77, "learning_rate": 6.37233202656507e-07, "loss": 1.1376, "step": 25712 }, { "epoch": 0.77, "learning_rate": 6.37070530203526e-07, "loss": 1.0771, "step": 25713 }, { "epoch": 0.77, "learning_rate": 6.369078754847361e-07, "loss": 1.1614, "step": 25714 }, { "epoch": 0.77, "learning_rate": 6.367452385016868e-07, "loss": 1.0914, "step": 25715 }, { "epoch": 0.77, "learning_rate": 6.365826192559249e-07, "loss": 1.1426, "step": 25716 }, { "epoch": 0.77, "learning_rate": 6.364200177489988e-07, "loss": 1.0805, "step": 25717 }, { "epoch": 0.77, "learning_rate": 6.362574339824565e-07, "loss": 1.1544, "step": 25718 }, { "epoch": 0.77, "learning_rate": 6.360948679578466e-07, "loss": 1.1066, "step": 25719 }, { "epoch": 0.77, "learning_rate": 6.359323196767153e-07, "loss": 1.0936, "step": 25720 }, { "epoch": 0.77, "learning_rate": 6.357697891406107e-07, "loss": 1.0234, "step": 25721 }, { "epoch": 0.77, "learning_rate": 6.356072763510795e-07, "loss": 1.0993, "step": 25722 }, { "epoch": 0.77, "learning_rate": 6.354447813096697e-07, "loss": 1.1862, "step": 25723 }, { "epoch": 0.77, "learning_rate": 6.352823040179273e-07, "loss": 1.0256, "step": 25724 }, { "epoch": 0.77, "learning_rate": 6.351198444773993e-07, "loss": 1.226, "step": 25725 }, { "epoch": 0.77, "learning_rate": 6.349574026896319e-07, "loss": 1.123, "step": 25726 }, { "epoch": 0.78, "learning_rate": 6.347949786561719e-07, "loss": 0.9713, "step": 25727 }, { "epoch": 0.78, "learning_rate": 6.346325723785663e-07, "loss": 1.1149, "step": 25728 }, { "epoch": 0.78, "learning_rate": 6.344701838583592e-07, "loss": 1.2074, "step": 25729 }, { "epoch": 0.78, "learning_rate": 6.343078130970976e-07, "loss": 1.0486, "step": 25730 }, { "epoch": 0.78, "learning_rate": 6.341454600963271e-07, "loss": 1.077, "step": 25731 }, { "epoch": 0.78, "learning_rate": 6.339831248575931e-07, "loss": 1.1266, "step": 25732 }, { "epoch": 0.78, "learning_rate": 6.33820807382442e-07, "loss": 1.0297, "step": 25733 }, { "epoch": 0.78, "learning_rate": 6.336585076724169e-07, "loss": 1.1088, "step": 25734 }, { "epoch": 0.78, "learning_rate": 6.334962257290645e-07, "loss": 1.2001, "step": 25735 }, { "epoch": 0.78, "learning_rate": 6.333339615539285e-07, "loss": 1.1266, "step": 25736 }, { "epoch": 0.78, "learning_rate": 6.331717151485545e-07, "loss": 1.2826, "step": 25737 }, { "epoch": 0.78, "learning_rate": 6.330094865144868e-07, "loss": 1.2742, "step": 25738 }, { "epoch": 0.78, "learning_rate": 6.328472756532695e-07, "loss": 1.1186, "step": 25739 }, { "epoch": 0.78, "learning_rate": 6.326850825664466e-07, "loss": 0.9572, "step": 25740 }, { "epoch": 0.78, "learning_rate": 6.325229072555634e-07, "loss": 1.0989, "step": 25741 }, { "epoch": 0.78, "learning_rate": 6.323607497221621e-07, "loss": 1.2629, "step": 25742 }, { "epoch": 0.78, "learning_rate": 6.321986099677868e-07, "loss": 1.201, "step": 25743 }, { "epoch": 0.78, "learning_rate": 6.320364879939811e-07, "loss": 1.1412, "step": 25744 }, { "epoch": 0.78, "learning_rate": 6.318743838022892e-07, "loss": 1.1494, "step": 25745 }, { "epoch": 0.78, "learning_rate": 6.317122973942527e-07, "loss": 1.1309, "step": 25746 }, { "epoch": 0.78, "learning_rate": 6.315502287714153e-07, "loss": 1.1136, "step": 25747 }, { "epoch": 0.78, "learning_rate": 6.313881779353198e-07, "loss": 0.9915, "step": 25748 }, { "epoch": 0.78, "learning_rate": 6.312261448875099e-07, "loss": 1.1429, "step": 25749 }, { "epoch": 0.78, "learning_rate": 6.310641296295261e-07, "loss": 1.017, "step": 25750 }, { "epoch": 0.78, "learning_rate": 6.309021321629116e-07, "loss": 1.1356, "step": 25751 }, { "epoch": 0.78, "learning_rate": 6.30740152489209e-07, "loss": 1.0939, "step": 25752 }, { "epoch": 0.78, "learning_rate": 6.305781906099603e-07, "loss": 1.1353, "step": 25753 }, { "epoch": 0.78, "learning_rate": 6.30416246526706e-07, "loss": 1.1011, "step": 25754 }, { "epoch": 0.78, "learning_rate": 6.302543202409888e-07, "loss": 1.068, "step": 25755 }, { "epoch": 0.78, "learning_rate": 6.300924117543503e-07, "loss": 1.1882, "step": 25756 }, { "epoch": 0.78, "learning_rate": 6.29930521068331e-07, "loss": 1.0523, "step": 25757 }, { "epoch": 0.78, "learning_rate": 6.297686481844734e-07, "loss": 1.0938, "step": 25758 }, { "epoch": 0.78, "learning_rate": 6.296067931043168e-07, "loss": 1.0439, "step": 25759 }, { "epoch": 0.78, "learning_rate": 6.294449558294028e-07, "loss": 1.0481, "step": 25760 }, { "epoch": 0.78, "learning_rate": 6.292831363612717e-07, "loss": 1.0681, "step": 25761 }, { "epoch": 0.78, "learning_rate": 6.291213347014641e-07, "loss": 1.1212, "step": 25762 }, { "epoch": 0.78, "learning_rate": 6.289595508515206e-07, "loss": 1.0913, "step": 25763 }, { "epoch": 0.78, "learning_rate": 6.287977848129812e-07, "loss": 1.0662, "step": 25764 }, { "epoch": 0.78, "learning_rate": 6.286360365873853e-07, "loss": 1.0625, "step": 25765 }, { "epoch": 0.78, "learning_rate": 6.284743061762741e-07, "loss": 1.1855, "step": 25766 }, { "epoch": 0.78, "learning_rate": 6.283125935811851e-07, "loss": 1.1253, "step": 25767 }, { "epoch": 0.78, "learning_rate": 6.281508988036589e-07, "loss": 1.1608, "step": 25768 }, { "epoch": 0.78, "learning_rate": 6.279892218452346e-07, "loss": 1.0828, "step": 25769 }, { "epoch": 0.78, "learning_rate": 6.278275627074515e-07, "loss": 1.1105, "step": 25770 }, { "epoch": 0.78, "learning_rate": 6.27665921391849e-07, "loss": 1.0607, "step": 25771 }, { "epoch": 0.78, "learning_rate": 6.275042978999643e-07, "loss": 0.9916, "step": 25772 }, { "epoch": 0.78, "learning_rate": 6.27342692233337e-07, "loss": 1.1055, "step": 25773 }, { "epoch": 0.78, "learning_rate": 6.271811043935055e-07, "loss": 1.171, "step": 25774 }, { "epoch": 0.78, "learning_rate": 6.270195343820085e-07, "loss": 1.1201, "step": 25775 }, { "epoch": 0.78, "learning_rate": 6.268579822003826e-07, "loss": 1.2386, "step": 25776 }, { "epoch": 0.78, "learning_rate": 6.266964478501666e-07, "loss": 1.014, "step": 25777 }, { "epoch": 0.78, "learning_rate": 6.265349313328984e-07, "loss": 1.1761, "step": 25778 }, { "epoch": 0.78, "learning_rate": 6.263734326501161e-07, "loss": 1.1044, "step": 25779 }, { "epoch": 0.78, "learning_rate": 6.262119518033555e-07, "loss": 1.2234, "step": 25780 }, { "epoch": 0.78, "learning_rate": 6.260504887941546e-07, "loss": 1.0886, "step": 25781 }, { "epoch": 0.78, "learning_rate": 6.258890436240505e-07, "loss": 1.142, "step": 25782 }, { "epoch": 0.78, "learning_rate": 6.257276162945802e-07, "loss": 1.0905, "step": 25783 }, { "epoch": 0.78, "learning_rate": 6.255662068072813e-07, "loss": 1.0086, "step": 25784 }, { "epoch": 0.78, "learning_rate": 6.254048151636882e-07, "loss": 1.0783, "step": 25785 }, { "epoch": 0.78, "learning_rate": 6.252434413653385e-07, "loss": 1.1701, "step": 25786 }, { "epoch": 0.78, "learning_rate": 6.250820854137685e-07, "loss": 1.1003, "step": 25787 }, { "epoch": 0.78, "learning_rate": 6.24920747310514e-07, "loss": 1.1194, "step": 25788 }, { "epoch": 0.78, "learning_rate": 6.247594270571108e-07, "loss": 1.1495, "step": 25789 }, { "epoch": 0.78, "learning_rate": 6.245981246550947e-07, "loss": 1.0508, "step": 25790 }, { "epoch": 0.78, "learning_rate": 6.244368401060013e-07, "loss": 1.0859, "step": 25791 }, { "epoch": 0.78, "learning_rate": 6.242755734113667e-07, "loss": 1.0804, "step": 25792 }, { "epoch": 0.78, "learning_rate": 6.241143245727247e-07, "loss": 1.1221, "step": 25793 }, { "epoch": 0.78, "learning_rate": 6.239530935916104e-07, "loss": 1.0278, "step": 25794 }, { "epoch": 0.78, "learning_rate": 6.237918804695594e-07, "loss": 1.1375, "step": 25795 }, { "epoch": 0.78, "learning_rate": 6.236306852081061e-07, "loss": 1.0714, "step": 25796 }, { "epoch": 0.78, "learning_rate": 6.234695078087858e-07, "loss": 1.0688, "step": 25797 }, { "epoch": 0.78, "learning_rate": 6.233083482731309e-07, "loss": 1.1301, "step": 25798 }, { "epoch": 0.78, "learning_rate": 6.23147206602677e-07, "loss": 1.2412, "step": 25799 }, { "epoch": 0.78, "learning_rate": 6.229860827989576e-07, "loss": 1.3323, "step": 25800 }, { "epoch": 0.78, "learning_rate": 6.228249768635075e-07, "loss": 1.115, "step": 25801 }, { "epoch": 0.78, "learning_rate": 6.226638887978589e-07, "loss": 1.1295, "step": 25802 }, { "epoch": 0.78, "learning_rate": 6.225028186035458e-07, "loss": 1.0023, "step": 25803 }, { "epoch": 0.78, "learning_rate": 6.223417662821018e-07, "loss": 1.0391, "step": 25804 }, { "epoch": 0.78, "learning_rate": 6.221807318350604e-07, "loss": 1.192, "step": 25805 }, { "epoch": 0.78, "learning_rate": 6.220197152639534e-07, "loss": 1.139, "step": 25806 }, { "epoch": 0.78, "learning_rate": 6.218587165703142e-07, "loss": 1.0787, "step": 25807 }, { "epoch": 0.78, "learning_rate": 6.216977357556755e-07, "loss": 1.1838, "step": 25808 }, { "epoch": 0.78, "learning_rate": 6.215367728215698e-07, "loss": 1.1594, "step": 25809 }, { "epoch": 0.78, "learning_rate": 6.2137582776953e-07, "loss": 1.0472, "step": 25810 }, { "epoch": 0.78, "learning_rate": 6.212149006010868e-07, "loss": 1.0398, "step": 25811 }, { "epoch": 0.78, "learning_rate": 6.210539913177729e-07, "loss": 1.0479, "step": 25812 }, { "epoch": 0.78, "learning_rate": 6.208930999211202e-07, "loss": 1.0859, "step": 25813 }, { "epoch": 0.78, "learning_rate": 6.2073222641266e-07, "loss": 1.0715, "step": 25814 }, { "epoch": 0.78, "learning_rate": 6.205713707939246e-07, "loss": 1.1612, "step": 25815 }, { "epoch": 0.78, "learning_rate": 6.204105330664439e-07, "loss": 1.0305, "step": 25816 }, { "epoch": 0.78, "learning_rate": 6.202497132317497e-07, "loss": 1.0942, "step": 25817 }, { "epoch": 0.78, "learning_rate": 6.20088911291373e-07, "loss": 1.2167, "step": 25818 }, { "epoch": 0.78, "learning_rate": 6.199281272468446e-07, "loss": 1.0231, "step": 25819 }, { "epoch": 0.78, "learning_rate": 6.197673610996946e-07, "loss": 1.0912, "step": 25820 }, { "epoch": 0.78, "learning_rate": 6.196066128514542e-07, "loss": 1.04, "step": 25821 }, { "epoch": 0.78, "learning_rate": 6.194458825036528e-07, "loss": 1.0959, "step": 25822 }, { "epoch": 0.78, "learning_rate": 6.192851700578218e-07, "loss": 1.2057, "step": 25823 }, { "epoch": 0.78, "learning_rate": 6.191244755154896e-07, "loss": 1.1265, "step": 25824 }, { "epoch": 0.78, "learning_rate": 6.189637988781863e-07, "loss": 1.0633, "step": 25825 }, { "epoch": 0.78, "learning_rate": 6.188031401474417e-07, "loss": 1.1176, "step": 25826 }, { "epoch": 0.78, "learning_rate": 6.186424993247861e-07, "loss": 1.0873, "step": 25827 }, { "epoch": 0.78, "learning_rate": 6.18481876411747e-07, "loss": 1.1015, "step": 25828 }, { "epoch": 0.78, "learning_rate": 6.183212714098541e-07, "loss": 1.1682, "step": 25829 }, { "epoch": 0.78, "learning_rate": 6.181606843206367e-07, "loss": 1.045, "step": 25830 }, { "epoch": 0.78, "learning_rate": 6.180001151456239e-07, "loss": 1.1589, "step": 25831 }, { "epoch": 0.78, "learning_rate": 6.17839563886343e-07, "loss": 1.1059, "step": 25832 }, { "epoch": 0.78, "learning_rate": 6.176790305443228e-07, "loss": 1.0485, "step": 25833 }, { "epoch": 0.78, "learning_rate": 6.175185151210917e-07, "loss": 1.0226, "step": 25834 }, { "epoch": 0.78, "learning_rate": 6.173580176181776e-07, "loss": 1.0142, "step": 25835 }, { "epoch": 0.78, "learning_rate": 6.171975380371092e-07, "loss": 1.2344, "step": 25836 }, { "epoch": 0.78, "learning_rate": 6.170370763794132e-07, "loss": 1.1655, "step": 25837 }, { "epoch": 0.78, "learning_rate": 6.168766326466169e-07, "loss": 1.0631, "step": 25838 }, { "epoch": 0.78, "learning_rate": 6.16716206840248e-07, "loss": 1.0297, "step": 25839 }, { "epoch": 0.78, "learning_rate": 6.165557989618348e-07, "loss": 1.0469, "step": 25840 }, { "epoch": 0.78, "learning_rate": 6.163954090129027e-07, "loss": 1.1173, "step": 25841 }, { "epoch": 0.78, "learning_rate": 6.162350369949787e-07, "loss": 1.1714, "step": 25842 }, { "epoch": 0.78, "learning_rate": 6.160746829095901e-07, "loss": 1.0473, "step": 25843 }, { "epoch": 0.78, "learning_rate": 6.159143467582632e-07, "loss": 1.0911, "step": 25844 }, { "epoch": 0.78, "learning_rate": 6.157540285425243e-07, "loss": 1.1563, "step": 25845 }, { "epoch": 0.78, "learning_rate": 6.155937282638997e-07, "loss": 1.04, "step": 25846 }, { "epoch": 0.78, "learning_rate": 6.15433445923915e-07, "loss": 1.1257, "step": 25847 }, { "epoch": 0.78, "learning_rate": 6.152731815240964e-07, "loss": 1.0673, "step": 25848 }, { "epoch": 0.78, "learning_rate": 6.151129350659702e-07, "loss": 1.1441, "step": 25849 }, { "epoch": 0.78, "learning_rate": 6.149527065510602e-07, "loss": 1.1205, "step": 25850 }, { "epoch": 0.78, "learning_rate": 6.147924959808926e-07, "loss": 1.1669, "step": 25851 }, { "epoch": 0.78, "learning_rate": 6.146323033569926e-07, "loss": 0.9853, "step": 25852 }, { "epoch": 0.78, "learning_rate": 6.144721286808855e-07, "loss": 1.0356, "step": 25853 }, { "epoch": 0.78, "learning_rate": 6.143119719540952e-07, "loss": 1.2151, "step": 25854 }, { "epoch": 0.78, "learning_rate": 6.141518331781465e-07, "loss": 1.1058, "step": 25855 }, { "epoch": 0.78, "learning_rate": 6.139917123545644e-07, "loss": 1.1956, "step": 25856 }, { "epoch": 0.78, "learning_rate": 6.138316094848734e-07, "loss": 1.1328, "step": 25857 }, { "epoch": 0.78, "learning_rate": 6.136715245705962e-07, "loss": 1.0716, "step": 25858 }, { "epoch": 0.78, "learning_rate": 6.135114576132578e-07, "loss": 1.0956, "step": 25859 }, { "epoch": 0.78, "learning_rate": 6.133514086143818e-07, "loss": 1.0724, "step": 25860 }, { "epoch": 0.78, "learning_rate": 6.131913775754916e-07, "loss": 1.1198, "step": 25861 }, { "epoch": 0.78, "learning_rate": 6.130313644981118e-07, "loss": 1.0956, "step": 25862 }, { "epoch": 0.78, "learning_rate": 6.128713693837634e-07, "loss": 1.0813, "step": 25863 }, { "epoch": 0.78, "learning_rate": 6.127113922339712e-07, "loss": 1.1141, "step": 25864 }, { "epoch": 0.78, "learning_rate": 6.125514330502572e-07, "loss": 1.1245, "step": 25865 }, { "epoch": 0.78, "learning_rate": 6.123914918341453e-07, "loss": 1.0721, "step": 25866 }, { "epoch": 0.78, "learning_rate": 6.122315685871566e-07, "loss": 1.0533, "step": 25867 }, { "epoch": 0.78, "learning_rate": 6.120716633108142e-07, "loss": 1.1564, "step": 25868 }, { "epoch": 0.78, "learning_rate": 6.119117760066406e-07, "loss": 1.2524, "step": 25869 }, { "epoch": 0.78, "learning_rate": 6.117519066761573e-07, "loss": 1.0895, "step": 25870 }, { "epoch": 0.78, "learning_rate": 6.115920553208865e-07, "loss": 1.0918, "step": 25871 }, { "epoch": 0.78, "learning_rate": 6.114322219423496e-07, "loss": 1.0905, "step": 25872 }, { "epoch": 0.78, "learning_rate": 6.112724065420686e-07, "loss": 1.1071, "step": 25873 }, { "epoch": 0.78, "learning_rate": 6.111126091215646e-07, "loss": 1.1297, "step": 25874 }, { "epoch": 0.78, "learning_rate": 6.109528296823597e-07, "loss": 1.1851, "step": 25875 }, { "epoch": 0.78, "learning_rate": 6.107930682259732e-07, "loss": 1.1498, "step": 25876 }, { "epoch": 0.78, "learning_rate": 6.106333247539268e-07, "loss": 1.1038, "step": 25877 }, { "epoch": 0.78, "learning_rate": 6.104735992677413e-07, "loss": 0.971, "step": 25878 }, { "epoch": 0.78, "learning_rate": 6.103138917689378e-07, "loss": 1.192, "step": 25879 }, { "epoch": 0.78, "learning_rate": 6.101542022590351e-07, "loss": 1.2185, "step": 25880 }, { "epoch": 0.78, "learning_rate": 6.099945307395544e-07, "loss": 1.0319, "step": 25881 }, { "epoch": 0.78, "learning_rate": 6.098348772120155e-07, "loss": 1.0756, "step": 25882 }, { "epoch": 0.78, "learning_rate": 6.09675241677939e-07, "loss": 1.1411, "step": 25883 }, { "epoch": 0.78, "learning_rate": 6.095156241388428e-07, "loss": 0.9792, "step": 25884 }, { "epoch": 0.78, "learning_rate": 6.093560245962473e-07, "loss": 1.0338, "step": 25885 }, { "epoch": 0.78, "learning_rate": 6.091964430516722e-07, "loss": 1.1767, "step": 25886 }, { "epoch": 0.78, "learning_rate": 6.090368795066362e-07, "loss": 1.2087, "step": 25887 }, { "epoch": 0.78, "learning_rate": 6.088773339626591e-07, "loss": 1.0305, "step": 25888 }, { "epoch": 0.78, "learning_rate": 6.087178064212585e-07, "loss": 1.2272, "step": 25889 }, { "epoch": 0.78, "learning_rate": 6.085582968839532e-07, "loss": 0.9708, "step": 25890 }, { "epoch": 0.78, "learning_rate": 6.083988053522621e-07, "loss": 1.1332, "step": 25891 }, { "epoch": 0.78, "learning_rate": 6.082393318277041e-07, "loss": 1.1418, "step": 25892 }, { "epoch": 0.78, "learning_rate": 6.080798763117957e-07, "loss": 1.1729, "step": 25893 }, { "epoch": 0.78, "learning_rate": 6.079204388060559e-07, "loss": 1.0756, "step": 25894 }, { "epoch": 0.78, "learning_rate": 6.07761019312002e-07, "loss": 0.9913, "step": 25895 }, { "epoch": 0.78, "learning_rate": 6.07601617831152e-07, "loss": 1.1362, "step": 25896 }, { "epoch": 0.78, "learning_rate": 6.074422343650232e-07, "loss": 1.0371, "step": 25897 }, { "epoch": 0.78, "learning_rate": 6.072828689151337e-07, "loss": 1.0992, "step": 25898 }, { "epoch": 0.78, "learning_rate": 6.071235214829988e-07, "loss": 1.1859, "step": 25899 }, { "epoch": 0.78, "learning_rate": 6.069641920701363e-07, "loss": 1.1422, "step": 25900 }, { "epoch": 0.78, "learning_rate": 6.06804880678063e-07, "loss": 1.0961, "step": 25901 }, { "epoch": 0.78, "learning_rate": 6.066455873082955e-07, "loss": 1.06, "step": 25902 }, { "epoch": 0.78, "learning_rate": 6.064863119623502e-07, "loss": 1.104, "step": 25903 }, { "epoch": 0.78, "learning_rate": 6.06327054641743e-07, "loss": 1.1028, "step": 25904 }, { "epoch": 0.78, "learning_rate": 6.061678153479914e-07, "loss": 1.2064, "step": 25905 }, { "epoch": 0.78, "learning_rate": 6.060085940826088e-07, "loss": 1.0688, "step": 25906 }, { "epoch": 0.78, "learning_rate": 6.058493908471128e-07, "loss": 1.1351, "step": 25907 }, { "epoch": 0.78, "learning_rate": 6.056902056430181e-07, "loss": 1.1432, "step": 25908 }, { "epoch": 0.78, "learning_rate": 6.055310384718408e-07, "loss": 1.1159, "step": 25909 }, { "epoch": 0.78, "learning_rate": 6.053718893350952e-07, "loss": 1.1422, "step": 25910 }, { "epoch": 0.78, "learning_rate": 6.052127582342965e-07, "loss": 1.0759, "step": 25911 }, { "epoch": 0.78, "learning_rate": 6.050536451709599e-07, "loss": 1.1248, "step": 25912 }, { "epoch": 0.78, "learning_rate": 6.048945501466e-07, "loss": 1.1754, "step": 25913 }, { "epoch": 0.78, "learning_rate": 6.047354731627319e-07, "loss": 1.066, "step": 25914 }, { "epoch": 0.78, "learning_rate": 6.045764142208685e-07, "loss": 0.9431, "step": 25915 }, { "epoch": 0.78, "learning_rate": 6.044173733225251e-07, "loss": 0.9963, "step": 25916 }, { "epoch": 0.78, "learning_rate": 6.042583504692152e-07, "loss": 1.1232, "step": 25917 }, { "epoch": 0.78, "learning_rate": 6.040993456624533e-07, "loss": 0.9661, "step": 25918 }, { "epoch": 0.78, "learning_rate": 6.039403589037521e-07, "loss": 1.1103, "step": 25919 }, { "epoch": 0.78, "learning_rate": 6.037813901946252e-07, "loss": 1.0146, "step": 25920 }, { "epoch": 0.78, "learning_rate": 6.036224395365864e-07, "loss": 1.1989, "step": 25921 }, { "epoch": 0.78, "learning_rate": 6.034635069311496e-07, "loss": 1.198, "step": 25922 }, { "epoch": 0.78, "learning_rate": 6.033045923798256e-07, "loss": 1.1309, "step": 25923 }, { "epoch": 0.78, "learning_rate": 6.031456958841286e-07, "loss": 1.0716, "step": 25924 }, { "epoch": 0.78, "learning_rate": 6.029868174455713e-07, "loss": 1.0672, "step": 25925 }, { "epoch": 0.78, "learning_rate": 6.028279570656657e-07, "loss": 1.1073, "step": 25926 }, { "epoch": 0.78, "learning_rate": 6.02669114745924e-07, "loss": 1.2131, "step": 25927 }, { "epoch": 0.78, "learning_rate": 6.025102904878588e-07, "loss": 1.1324, "step": 25928 }, { "epoch": 0.78, "learning_rate": 6.023514842929817e-07, "loss": 1.0741, "step": 25929 }, { "epoch": 0.78, "learning_rate": 6.021926961628044e-07, "loss": 1.158, "step": 25930 }, { "epoch": 0.78, "learning_rate": 6.020339260988395e-07, "loss": 1.1228, "step": 25931 }, { "epoch": 0.78, "learning_rate": 6.018751741025969e-07, "loss": 1.0685, "step": 25932 }, { "epoch": 0.78, "learning_rate": 6.017164401755882e-07, "loss": 1.0591, "step": 25933 }, { "epoch": 0.78, "learning_rate": 6.015577243193249e-07, "loss": 1.1569, "step": 25934 }, { "epoch": 0.78, "learning_rate": 6.013990265353187e-07, "loss": 1.1447, "step": 25935 }, { "epoch": 0.78, "learning_rate": 6.012403468250783e-07, "loss": 1.1533, "step": 25936 }, { "epoch": 0.78, "learning_rate": 6.010816851901155e-07, "loss": 1.213, "step": 25937 }, { "epoch": 0.78, "learning_rate": 6.009230416319403e-07, "loss": 1.0702, "step": 25938 }, { "epoch": 0.78, "learning_rate": 6.00764416152064e-07, "loss": 1.0229, "step": 25939 }, { "epoch": 0.78, "learning_rate": 6.00605808751995e-07, "loss": 1.085, "step": 25940 }, { "epoch": 0.78, "learning_rate": 6.004472194332439e-07, "loss": 1.1147, "step": 25941 }, { "epoch": 0.78, "learning_rate": 6.002886481973206e-07, "loss": 1.3005, "step": 25942 }, { "epoch": 0.78, "learning_rate": 6.001300950457343e-07, "loss": 1.0934, "step": 25943 }, { "epoch": 0.78, "learning_rate": 5.999715599799949e-07, "loss": 1.2006, "step": 25944 }, { "epoch": 0.78, "learning_rate": 5.998130430016108e-07, "loss": 1.1932, "step": 25945 }, { "epoch": 0.78, "learning_rate": 5.996545441120913e-07, "loss": 0.9888, "step": 25946 }, { "epoch": 0.78, "learning_rate": 5.994960633129454e-07, "loss": 1.0964, "step": 25947 }, { "epoch": 0.78, "learning_rate": 5.993376006056823e-07, "loss": 1.0898, "step": 25948 }, { "epoch": 0.78, "learning_rate": 5.991791559918092e-07, "loss": 1.1793, "step": 25949 }, { "epoch": 0.78, "learning_rate": 5.990207294728348e-07, "loss": 1.1887, "step": 25950 }, { "epoch": 0.78, "learning_rate": 5.988623210502678e-07, "loss": 1.1487, "step": 25951 }, { "epoch": 0.78, "learning_rate": 5.987039307256157e-07, "loss": 1.0328, "step": 25952 }, { "epoch": 0.78, "learning_rate": 5.985455585003866e-07, "loss": 1.1907, "step": 25953 }, { "epoch": 0.78, "learning_rate": 5.983872043760879e-07, "loss": 1.0598, "step": 25954 }, { "epoch": 0.78, "learning_rate": 5.982288683542273e-07, "loss": 1.0385, "step": 25955 }, { "epoch": 0.78, "learning_rate": 5.980705504363118e-07, "loss": 1.059, "step": 25956 }, { "epoch": 0.78, "learning_rate": 5.979122506238497e-07, "loss": 1.1064, "step": 25957 }, { "epoch": 0.78, "learning_rate": 5.977539689183459e-07, "loss": 1.0421, "step": 25958 }, { "epoch": 0.78, "learning_rate": 5.975957053213083e-07, "loss": 1.0635, "step": 25959 }, { "epoch": 0.78, "learning_rate": 5.974374598342431e-07, "loss": 0.9929, "step": 25960 }, { "epoch": 0.78, "learning_rate": 5.972792324586579e-07, "loss": 1.1214, "step": 25961 }, { "epoch": 0.78, "learning_rate": 5.971210231960572e-07, "loss": 1.1207, "step": 25962 }, { "epoch": 0.78, "learning_rate": 5.969628320479481e-07, "loss": 1.0422, "step": 25963 }, { "epoch": 0.78, "learning_rate": 5.96804659015836e-07, "loss": 1.1382, "step": 25964 }, { "epoch": 0.78, "learning_rate": 5.966465041012279e-07, "loss": 1.1281, "step": 25965 }, { "epoch": 0.78, "learning_rate": 5.964883673056277e-07, "loss": 1.0511, "step": 25966 }, { "epoch": 0.78, "learning_rate": 5.963302486305414e-07, "loss": 1.1815, "step": 25967 }, { "epoch": 0.78, "learning_rate": 5.961721480774743e-07, "loss": 1.2411, "step": 25968 }, { "epoch": 0.78, "learning_rate": 5.960140656479313e-07, "loss": 1.1197, "step": 25969 }, { "epoch": 0.78, "learning_rate": 5.958560013434183e-07, "loss": 1.1265, "step": 25970 }, { "epoch": 0.78, "learning_rate": 5.956979551654382e-07, "loss": 1.1278, "step": 25971 }, { "epoch": 0.78, "learning_rate": 5.955399271154966e-07, "loss": 1.1201, "step": 25972 }, { "epoch": 0.78, "learning_rate": 5.953819171950975e-07, "loss": 0.9517, "step": 25973 }, { "epoch": 0.78, "learning_rate": 5.952239254057463e-07, "loss": 1.0478, "step": 25974 }, { "epoch": 0.78, "learning_rate": 5.950659517489449e-07, "loss": 1.1782, "step": 25975 }, { "epoch": 0.78, "learning_rate": 5.949079962261984e-07, "loss": 1.0281, "step": 25976 }, { "epoch": 0.78, "learning_rate": 5.947500588390101e-07, "loss": 1.1053, "step": 25977 }, { "epoch": 0.78, "learning_rate": 5.945921395888837e-07, "loss": 1.1217, "step": 25978 }, { "epoch": 0.78, "learning_rate": 5.944342384773224e-07, "loss": 0.989, "step": 25979 }, { "epoch": 0.78, "learning_rate": 5.942763555058304e-07, "loss": 1.1234, "step": 25980 }, { "epoch": 0.78, "learning_rate": 5.941184906759087e-07, "loss": 1.1093, "step": 25981 }, { "epoch": 0.78, "learning_rate": 5.93960643989061e-07, "loss": 1.0381, "step": 25982 }, { "epoch": 0.78, "learning_rate": 5.938028154467901e-07, "loss": 1.0372, "step": 25983 }, { "epoch": 0.78, "learning_rate": 5.936450050505985e-07, "loss": 0.9922, "step": 25984 }, { "epoch": 0.78, "learning_rate": 5.934872128019881e-07, "loss": 1.1133, "step": 25985 }, { "epoch": 0.78, "learning_rate": 5.933294387024613e-07, "loss": 1.186, "step": 25986 }, { "epoch": 0.78, "learning_rate": 5.931716827535206e-07, "loss": 1.1101, "step": 25987 }, { "epoch": 0.78, "learning_rate": 5.930139449566663e-07, "loss": 1.1495, "step": 25988 }, { "epoch": 0.78, "learning_rate": 5.92856225313401e-07, "loss": 1.0881, "step": 25989 }, { "epoch": 0.78, "learning_rate": 5.926985238252259e-07, "loss": 1.0665, "step": 25990 }, { "epoch": 0.78, "learning_rate": 5.92540840493643e-07, "loss": 1.0314, "step": 25991 }, { "epoch": 0.78, "learning_rate": 5.92383175320152e-07, "loss": 1.0735, "step": 25992 }, { "epoch": 0.78, "learning_rate": 5.922255283062542e-07, "loss": 1.2356, "step": 25993 }, { "epoch": 0.78, "learning_rate": 5.920678994534507e-07, "loss": 1.0327, "step": 25994 }, { "epoch": 0.78, "learning_rate": 5.91910288763242e-07, "loss": 1.1393, "step": 25995 }, { "epoch": 0.78, "learning_rate": 5.917526962371289e-07, "loss": 1.2061, "step": 25996 }, { "epoch": 0.78, "learning_rate": 5.915951218766102e-07, "loss": 1.1241, "step": 25997 }, { "epoch": 0.78, "learning_rate": 5.914375656831872e-07, "loss": 1.1635, "step": 25998 }, { "epoch": 0.78, "learning_rate": 5.912800276583594e-07, "loss": 1.1932, "step": 25999 }, { "epoch": 0.78, "learning_rate": 5.91122507803627e-07, "loss": 1.0845, "step": 26000 }, { "epoch": 0.78, "learning_rate": 5.909650061204883e-07, "loss": 1.1069, "step": 26001 }, { "epoch": 0.78, "learning_rate": 5.908075226104432e-07, "loss": 1.0489, "step": 26002 }, { "epoch": 0.78, "learning_rate": 5.906500572749913e-07, "loss": 1.1702, "step": 26003 }, { "epoch": 0.78, "learning_rate": 5.904926101156316e-07, "loss": 1.1844, "step": 26004 }, { "epoch": 0.78, "learning_rate": 5.90335181133862e-07, "loss": 1.1249, "step": 26005 }, { "epoch": 0.78, "learning_rate": 5.90177770331182e-07, "loss": 1.1841, "step": 26006 }, { "epoch": 0.78, "learning_rate": 5.900203777090896e-07, "loss": 1.0735, "step": 26007 }, { "epoch": 0.78, "learning_rate": 5.898630032690833e-07, "loss": 1.0126, "step": 26008 }, { "epoch": 0.78, "learning_rate": 5.897056470126613e-07, "loss": 1.1013, "step": 26009 }, { "epoch": 0.78, "learning_rate": 5.895483089413217e-07, "loss": 1.0939, "step": 26010 }, { "epoch": 0.78, "learning_rate": 5.893909890565618e-07, "loss": 1.1644, "step": 26011 }, { "epoch": 0.78, "learning_rate": 5.892336873598798e-07, "loss": 1.1602, "step": 26012 }, { "epoch": 0.78, "learning_rate": 5.890764038527732e-07, "loss": 1.0306, "step": 26013 }, { "epoch": 0.78, "learning_rate": 5.889191385367385e-07, "loss": 1.2174, "step": 26014 }, { "epoch": 0.78, "learning_rate": 5.887618914132731e-07, "loss": 1.0767, "step": 26015 }, { "epoch": 0.78, "learning_rate": 5.88604662483874e-07, "loss": 1.0765, "step": 26016 }, { "epoch": 0.78, "learning_rate": 5.884474517500388e-07, "loss": 1.2534, "step": 26017 }, { "epoch": 0.78, "learning_rate": 5.882902592132622e-07, "loss": 1.067, "step": 26018 }, { "epoch": 0.78, "learning_rate": 5.881330848750419e-07, "loss": 1.1066, "step": 26019 }, { "epoch": 0.78, "learning_rate": 5.879759287368736e-07, "loss": 1.0955, "step": 26020 }, { "epoch": 0.78, "learning_rate": 5.878187908002538e-07, "loss": 1.03, "step": 26021 }, { "epoch": 0.78, "learning_rate": 5.876616710666788e-07, "loss": 1.0365, "step": 26022 }, { "epoch": 0.78, "learning_rate": 5.87504569537643e-07, "loss": 1.1227, "step": 26023 }, { "epoch": 0.78, "learning_rate": 5.873474862146425e-07, "loss": 1.0478, "step": 26024 }, { "epoch": 0.78, "learning_rate": 5.87190421099173e-07, "loss": 0.9384, "step": 26025 }, { "epoch": 0.78, "learning_rate": 5.870333741927301e-07, "loss": 1.2007, "step": 26026 }, { "epoch": 0.78, "learning_rate": 5.868763454968074e-07, "loss": 1.0778, "step": 26027 }, { "epoch": 0.78, "learning_rate": 5.867193350129003e-07, "loss": 1.0749, "step": 26028 }, { "epoch": 0.78, "learning_rate": 5.865623427425038e-07, "loss": 1.1914, "step": 26029 }, { "epoch": 0.78, "learning_rate": 5.864053686871129e-07, "loss": 1.1295, "step": 26030 }, { "epoch": 0.78, "learning_rate": 5.862484128482207e-07, "loss": 1.178, "step": 26031 }, { "epoch": 0.78, "learning_rate": 5.860914752273219e-07, "loss": 1.1066, "step": 26032 }, { "epoch": 0.78, "learning_rate": 5.859345558259106e-07, "loss": 1.165, "step": 26033 }, { "epoch": 0.78, "learning_rate": 5.857776546454802e-07, "loss": 1.0042, "step": 26034 }, { "epoch": 0.78, "learning_rate": 5.856207716875248e-07, "loss": 1.1298, "step": 26035 }, { "epoch": 0.78, "learning_rate": 5.854639069535376e-07, "loss": 1.08, "step": 26036 }, { "epoch": 0.78, "learning_rate": 5.85307060445012e-07, "loss": 1.2631, "step": 26037 }, { "epoch": 0.78, "learning_rate": 5.851502321634408e-07, "loss": 1.0446, "step": 26038 }, { "epoch": 0.78, "learning_rate": 5.849934221103182e-07, "loss": 1.2104, "step": 26039 }, { "epoch": 0.78, "learning_rate": 5.84836630287135e-07, "loss": 1.0184, "step": 26040 }, { "epoch": 0.78, "learning_rate": 5.846798566953848e-07, "loss": 1.0602, "step": 26041 }, { "epoch": 0.78, "learning_rate": 5.845231013365599e-07, "loss": 1.0975, "step": 26042 }, { "epoch": 0.78, "learning_rate": 5.843663642121533e-07, "loss": 1.1318, "step": 26043 }, { "epoch": 0.78, "learning_rate": 5.842096453236554e-07, "loss": 1.0452, "step": 26044 }, { "epoch": 0.78, "learning_rate": 5.840529446725593e-07, "loss": 1.2138, "step": 26045 }, { "epoch": 0.78, "learning_rate": 5.838962622603561e-07, "loss": 1.0746, "step": 26046 }, { "epoch": 0.78, "learning_rate": 5.83739598088538e-07, "loss": 1.1271, "step": 26047 }, { "epoch": 0.78, "learning_rate": 5.835829521585964e-07, "loss": 1.1996, "step": 26048 }, { "epoch": 0.78, "learning_rate": 5.834263244720217e-07, "loss": 1.0549, "step": 26049 }, { "epoch": 0.78, "learning_rate": 5.832697150303052e-07, "loss": 0.9641, "step": 26050 }, { "epoch": 0.78, "learning_rate": 5.831131238349378e-07, "loss": 1.1328, "step": 26051 }, { "epoch": 0.78, "learning_rate": 5.82956550887411e-07, "loss": 1.0282, "step": 26052 }, { "epoch": 0.78, "learning_rate": 5.827999961892139e-07, "loss": 1.2624, "step": 26053 }, { "epoch": 0.78, "learning_rate": 5.826434597418376e-07, "loss": 1.0692, "step": 26054 }, { "epoch": 0.78, "learning_rate": 5.824869415467718e-07, "loss": 1.1051, "step": 26055 }, { "epoch": 0.78, "learning_rate": 5.823304416055079e-07, "loss": 1.1569, "step": 26056 }, { "epoch": 0.78, "learning_rate": 5.821739599195337e-07, "loss": 1.1078, "step": 26057 }, { "epoch": 0.78, "learning_rate": 5.820174964903397e-07, "loss": 1.1502, "step": 26058 }, { "epoch": 0.79, "learning_rate": 5.818610513194156e-07, "loss": 0.9613, "step": 26059 }, { "epoch": 0.79, "learning_rate": 5.817046244082503e-07, "loss": 1.1477, "step": 26060 }, { "epoch": 0.79, "learning_rate": 5.815482157583333e-07, "loss": 1.1564, "step": 26061 }, { "epoch": 0.79, "learning_rate": 5.813918253711537e-07, "loss": 1.1728, "step": 26062 }, { "epoch": 0.79, "learning_rate": 5.812354532481995e-07, "loss": 1.1133, "step": 26063 }, { "epoch": 0.79, "learning_rate": 5.810790993909596e-07, "loss": 1.1043, "step": 26064 }, { "epoch": 0.79, "learning_rate": 5.809227638009224e-07, "loss": 1.1418, "step": 26065 }, { "epoch": 0.79, "learning_rate": 5.807664464795762e-07, "loss": 1.0935, "step": 26066 }, { "epoch": 0.79, "learning_rate": 5.80610147428409e-07, "loss": 1.0887, "step": 26067 }, { "epoch": 0.79, "learning_rate": 5.80453866648909e-07, "loss": 0.9912, "step": 26068 }, { "epoch": 0.79, "learning_rate": 5.802976041425645e-07, "loss": 1.1503, "step": 26069 }, { "epoch": 0.79, "learning_rate": 5.801413599108613e-07, "loss": 1.1028, "step": 26070 }, { "epoch": 0.79, "learning_rate": 5.799851339552878e-07, "loss": 1.0447, "step": 26071 }, { "epoch": 0.79, "learning_rate": 5.798289262773312e-07, "loss": 1.0688, "step": 26072 }, { "epoch": 0.79, "learning_rate": 5.796727368784782e-07, "loss": 1.1498, "step": 26073 }, { "epoch": 0.79, "learning_rate": 5.79516565760217e-07, "loss": 1.2463, "step": 26074 }, { "epoch": 0.79, "learning_rate": 5.793604129240321e-07, "loss": 1.1503, "step": 26075 }, { "epoch": 0.79, "learning_rate": 5.792042783714111e-07, "loss": 1.1141, "step": 26076 }, { "epoch": 0.79, "learning_rate": 5.790481621038405e-07, "loss": 1.0234, "step": 26077 }, { "epoch": 0.79, "learning_rate": 5.788920641228065e-07, "loss": 1.1349, "step": 26078 }, { "epoch": 0.79, "learning_rate": 5.787359844297946e-07, "loss": 1.1393, "step": 26079 }, { "epoch": 0.79, "learning_rate": 5.785799230262906e-07, "loss": 1.1105, "step": 26080 }, { "epoch": 0.79, "learning_rate": 5.784238799137804e-07, "loss": 1.1648, "step": 26081 }, { "epoch": 0.79, "learning_rate": 5.782678550937501e-07, "loss": 1.0644, "step": 26082 }, { "epoch": 0.79, "learning_rate": 5.781118485676834e-07, "loss": 1.0816, "step": 26083 }, { "epoch": 0.79, "learning_rate": 5.779558603370666e-07, "loss": 1.002, "step": 26084 }, { "epoch": 0.79, "learning_rate": 5.777998904033841e-07, "loss": 1.1001, "step": 26085 }, { "epoch": 0.79, "learning_rate": 5.776439387681209e-07, "loss": 1.1874, "step": 26086 }, { "epoch": 0.79, "learning_rate": 5.774880054327622e-07, "loss": 1.0787, "step": 26087 }, { "epoch": 0.79, "learning_rate": 5.773320903987912e-07, "loss": 1.1006, "step": 26088 }, { "epoch": 0.79, "learning_rate": 5.771761936676929e-07, "loss": 1.0863, "step": 26089 }, { "epoch": 0.79, "learning_rate": 5.770203152409506e-07, "loss": 1.0795, "step": 26090 }, { "epoch": 0.79, "learning_rate": 5.768644551200492e-07, "loss": 1.0014, "step": 26091 }, { "epoch": 0.79, "learning_rate": 5.76708613306472e-07, "loss": 1.1823, "step": 26092 }, { "epoch": 0.79, "learning_rate": 5.765527898017024e-07, "loss": 1.133, "step": 26093 }, { "epoch": 0.79, "learning_rate": 5.763969846072237e-07, "loss": 1.2018, "step": 26094 }, { "epoch": 0.79, "learning_rate": 5.762411977245203e-07, "loss": 1.0336, "step": 26095 }, { "epoch": 0.79, "learning_rate": 5.760854291550733e-07, "loss": 1.111, "step": 26096 }, { "epoch": 0.79, "learning_rate": 5.759296789003665e-07, "loss": 1.0111, "step": 26097 }, { "epoch": 0.79, "learning_rate": 5.757739469618826e-07, "loss": 1.1553, "step": 26098 }, { "epoch": 0.79, "learning_rate": 5.756182333411037e-07, "loss": 1.0569, "step": 26099 }, { "epoch": 0.79, "learning_rate": 5.754625380395132e-07, "loss": 1.1352, "step": 26100 }, { "epoch": 0.79, "learning_rate": 5.753068610585918e-07, "loss": 1.074, "step": 26101 }, { "epoch": 0.79, "learning_rate": 5.751512023998221e-07, "loss": 1.0257, "step": 26102 }, { "epoch": 0.79, "learning_rate": 5.749955620646858e-07, "loss": 1.0584, "step": 26103 }, { "epoch": 0.79, "learning_rate": 5.748399400546656e-07, "loss": 1.053, "step": 26104 }, { "epoch": 0.79, "learning_rate": 5.746843363712412e-07, "loss": 1.0655, "step": 26105 }, { "epoch": 0.79, "learning_rate": 5.745287510158945e-07, "loss": 1.0593, "step": 26106 }, { "epoch": 0.79, "learning_rate": 5.743731839901067e-07, "loss": 1.0192, "step": 26107 }, { "epoch": 0.79, "learning_rate": 5.742176352953596e-07, "loss": 1.0673, "step": 26108 }, { "epoch": 0.79, "learning_rate": 5.740621049331327e-07, "loss": 1.0421, "step": 26109 }, { "epoch": 0.79, "learning_rate": 5.739065929049065e-07, "loss": 1.1478, "step": 26110 }, { "epoch": 0.79, "learning_rate": 5.737510992121622e-07, "loss": 1.1243, "step": 26111 }, { "epoch": 0.79, "learning_rate": 5.735956238563803e-07, "loss": 1.1654, "step": 26112 }, { "epoch": 0.79, "learning_rate": 5.734401668390396e-07, "loss": 1.1058, "step": 26113 }, { "epoch": 0.79, "learning_rate": 5.732847281616208e-07, "loss": 1.0646, "step": 26114 }, { "epoch": 0.79, "learning_rate": 5.731293078256034e-07, "loss": 1.0027, "step": 26115 }, { "epoch": 0.79, "learning_rate": 5.729739058324668e-07, "loss": 1.1167, "step": 26116 }, { "epoch": 0.79, "learning_rate": 5.728185221836907e-07, "loss": 0.9915, "step": 26117 }, { "epoch": 0.79, "learning_rate": 5.726631568807539e-07, "loss": 1.0138, "step": 26118 }, { "epoch": 0.79, "learning_rate": 5.725078099251358e-07, "loss": 1.0403, "step": 26119 }, { "epoch": 0.79, "learning_rate": 5.723524813183151e-07, "loss": 1.0764, "step": 26120 }, { "epoch": 0.79, "learning_rate": 5.721971710617707e-07, "loss": 1.1043, "step": 26121 }, { "epoch": 0.79, "learning_rate": 5.720418791569804e-07, "loss": 1.1238, "step": 26122 }, { "epoch": 0.79, "learning_rate": 5.718866056054228e-07, "loss": 1.105, "step": 26123 }, { "epoch": 0.79, "learning_rate": 5.717313504085762e-07, "loss": 1.0122, "step": 26124 }, { "epoch": 0.79, "learning_rate": 5.71576113567919e-07, "loss": 1.171, "step": 26125 }, { "epoch": 0.79, "learning_rate": 5.714208950849279e-07, "loss": 1.0531, "step": 26126 }, { "epoch": 0.79, "learning_rate": 5.71265694961081e-07, "loss": 1.0151, "step": 26127 }, { "epoch": 0.79, "learning_rate": 5.711105131978558e-07, "loss": 1.014, "step": 26128 }, { "epoch": 0.79, "learning_rate": 5.709553497967293e-07, "loss": 1.2077, "step": 26129 }, { "epoch": 0.79, "learning_rate": 5.708002047591799e-07, "loss": 1.1494, "step": 26130 }, { "epoch": 0.79, "learning_rate": 5.706450780866823e-07, "loss": 1.025, "step": 26131 }, { "epoch": 0.79, "learning_rate": 5.704899697807145e-07, "loss": 1.1014, "step": 26132 }, { "epoch": 0.79, "learning_rate": 5.70334879842753e-07, "loss": 1.0208, "step": 26133 }, { "epoch": 0.79, "learning_rate": 5.701798082742749e-07, "loss": 1.1906, "step": 26134 }, { "epoch": 0.79, "learning_rate": 5.700247550767546e-07, "loss": 1.0904, "step": 26135 }, { "epoch": 0.79, "learning_rate": 5.698697202516693e-07, "loss": 1.2463, "step": 26136 }, { "epoch": 0.79, "learning_rate": 5.697147038004946e-07, "loss": 1.1423, "step": 26137 }, { "epoch": 0.79, "learning_rate": 5.695597057247071e-07, "loss": 1.024, "step": 26138 }, { "epoch": 0.79, "learning_rate": 5.694047260257807e-07, "loss": 1.0969, "step": 26139 }, { "epoch": 0.79, "learning_rate": 5.692497647051911e-07, "loss": 1.1025, "step": 26140 }, { "epoch": 0.79, "learning_rate": 5.690948217644143e-07, "loss": 1.0963, "step": 26141 }, { "epoch": 0.79, "learning_rate": 5.689398972049249e-07, "loss": 1.0792, "step": 26142 }, { "epoch": 0.79, "learning_rate": 5.687849910281976e-07, "loss": 1.044, "step": 26143 }, { "epoch": 0.79, "learning_rate": 5.686301032357075e-07, "loss": 1.3112, "step": 26144 }, { "epoch": 0.79, "learning_rate": 5.684752338289281e-07, "loss": 1.1542, "step": 26145 }, { "epoch": 0.79, "learning_rate": 5.683203828093342e-07, "loss": 1.1219, "step": 26146 }, { "epoch": 0.79, "learning_rate": 5.681655501784001e-07, "loss": 1.1471, "step": 26147 }, { "epoch": 0.79, "learning_rate": 5.680107359375994e-07, "loss": 1.0621, "step": 26148 }, { "epoch": 0.79, "learning_rate": 5.678559400884059e-07, "loss": 0.9938, "step": 26149 }, { "epoch": 0.79, "learning_rate": 5.677011626322936e-07, "loss": 1.0375, "step": 26150 }, { "epoch": 0.79, "learning_rate": 5.675464035707363e-07, "loss": 1.1237, "step": 26151 }, { "epoch": 0.79, "learning_rate": 5.673916629052057e-07, "loss": 1.1416, "step": 26152 }, { "epoch": 0.79, "learning_rate": 5.672369406371756e-07, "loss": 1.0695, "step": 26153 }, { "epoch": 0.79, "learning_rate": 5.670822367681189e-07, "loss": 1.0014, "step": 26154 }, { "epoch": 0.79, "learning_rate": 5.669275512995088e-07, "loss": 1.1298, "step": 26155 }, { "epoch": 0.79, "learning_rate": 5.667728842328177e-07, "loss": 1.0237, "step": 26156 }, { "epoch": 0.79, "learning_rate": 5.666182355695171e-07, "loss": 1.1639, "step": 26157 }, { "epoch": 0.79, "learning_rate": 5.664636053110797e-07, "loss": 1.137, "step": 26158 }, { "epoch": 0.79, "learning_rate": 5.663089934589777e-07, "loss": 1.1815, "step": 26159 }, { "epoch": 0.79, "learning_rate": 5.661544000146835e-07, "loss": 1.0688, "step": 26160 }, { "epoch": 0.79, "learning_rate": 5.659998249796673e-07, "loss": 1.1661, "step": 26161 }, { "epoch": 0.79, "learning_rate": 5.658452683554011e-07, "loss": 1.1038, "step": 26162 }, { "epoch": 0.79, "learning_rate": 5.656907301433565e-07, "loss": 1.1378, "step": 26163 }, { "epoch": 0.79, "learning_rate": 5.655362103450054e-07, "loss": 1.1508, "step": 26164 }, { "epoch": 0.79, "learning_rate": 5.653817089618172e-07, "loss": 1.0761, "step": 26165 }, { "epoch": 0.79, "learning_rate": 5.652272259952632e-07, "loss": 1.0959, "step": 26166 }, { "epoch": 0.79, "learning_rate": 5.650727614468143e-07, "loss": 1.1495, "step": 26167 }, { "epoch": 0.79, "learning_rate": 5.649183153179407e-07, "loss": 1.1235, "step": 26168 }, { "epoch": 0.79, "learning_rate": 5.647638876101139e-07, "loss": 1.15, "step": 26169 }, { "epoch": 0.79, "learning_rate": 5.646094783248018e-07, "loss": 1.0381, "step": 26170 }, { "epoch": 0.79, "learning_rate": 5.644550874634754e-07, "loss": 1.1296, "step": 26171 }, { "epoch": 0.79, "learning_rate": 5.643007150276045e-07, "loss": 1.1469, "step": 26172 }, { "epoch": 0.79, "learning_rate": 5.641463610186582e-07, "loss": 0.9845, "step": 26173 }, { "epoch": 0.79, "learning_rate": 5.639920254381065e-07, "loss": 1.1151, "step": 26174 }, { "epoch": 0.79, "learning_rate": 5.638377082874183e-07, "loss": 1.1166, "step": 26175 }, { "epoch": 0.79, "learning_rate": 5.636834095680624e-07, "loss": 1.0969, "step": 26176 }, { "epoch": 0.79, "learning_rate": 5.635291292815087e-07, "loss": 1.0985, "step": 26177 }, { "epoch": 0.79, "learning_rate": 5.633748674292244e-07, "loss": 1.1077, "step": 26178 }, { "epoch": 0.79, "learning_rate": 5.632206240126786e-07, "loss": 1.0905, "step": 26179 }, { "epoch": 0.79, "learning_rate": 5.630663990333399e-07, "loss": 1.1127, "step": 26180 }, { "epoch": 0.79, "learning_rate": 5.629121924926759e-07, "loss": 1.1503, "step": 26181 }, { "epoch": 0.79, "learning_rate": 5.627580043921558e-07, "loss": 1.0959, "step": 26182 }, { "epoch": 0.79, "learning_rate": 5.626038347332458e-07, "loss": 1.2095, "step": 26183 }, { "epoch": 0.79, "learning_rate": 5.62449683517414e-07, "loss": 0.9807, "step": 26184 }, { "epoch": 0.79, "learning_rate": 5.622955507461283e-07, "loss": 0.9792, "step": 26185 }, { "epoch": 0.79, "learning_rate": 5.621414364208563e-07, "loss": 1.1089, "step": 26186 }, { "epoch": 0.79, "learning_rate": 5.619873405430637e-07, "loss": 1.1275, "step": 26187 }, { "epoch": 0.79, "learning_rate": 5.618332631142184e-07, "loss": 1.1021, "step": 26188 }, { "epoch": 0.79, "learning_rate": 5.616792041357869e-07, "loss": 1.0349, "step": 26189 }, { "epoch": 0.79, "learning_rate": 5.615251636092367e-07, "loss": 1.1022, "step": 26190 }, { "epoch": 0.79, "learning_rate": 5.613711415360326e-07, "loss": 1.1184, "step": 26191 }, { "epoch": 0.79, "learning_rate": 5.612171379176414e-07, "loss": 1.1976, "step": 26192 }, { "epoch": 0.79, "learning_rate": 5.610631527555293e-07, "loss": 1.2638, "step": 26193 }, { "epoch": 0.79, "learning_rate": 5.609091860511622e-07, "loss": 1.0115, "step": 26194 }, { "epoch": 0.79, "learning_rate": 5.607552378060066e-07, "loss": 1.1169, "step": 26195 }, { "epoch": 0.79, "learning_rate": 5.606013080215265e-07, "loss": 1.1156, "step": 26196 }, { "epoch": 0.79, "learning_rate": 5.604473966991877e-07, "loss": 1.1285, "step": 26197 }, { "epoch": 0.79, "learning_rate": 5.602935038404555e-07, "loss": 1.223, "step": 26198 }, { "epoch": 0.79, "learning_rate": 5.601396294467954e-07, "loss": 1.0921, "step": 26199 }, { "epoch": 0.79, "learning_rate": 5.599857735196712e-07, "loss": 1.167, "step": 26200 }, { "epoch": 0.79, "learning_rate": 5.598319360605484e-07, "loss": 1.213, "step": 26201 }, { "epoch": 0.79, "learning_rate": 5.596781170708912e-07, "loss": 1.0827, "step": 26202 }, { "epoch": 0.79, "learning_rate": 5.595243165521644e-07, "loss": 1.145, "step": 26203 }, { "epoch": 0.79, "learning_rate": 5.593705345058309e-07, "loss": 1.1005, "step": 26204 }, { "epoch": 0.79, "learning_rate": 5.592167709333552e-07, "loss": 1.1519, "step": 26205 }, { "epoch": 0.79, "learning_rate": 5.590630258362012e-07, "loss": 1.0248, "step": 26206 }, { "epoch": 0.79, "learning_rate": 5.589092992158324e-07, "loss": 0.9836, "step": 26207 }, { "epoch": 0.79, "learning_rate": 5.587555910737127e-07, "loss": 1.1057, "step": 26208 }, { "epoch": 0.79, "learning_rate": 5.586019014113045e-07, "loss": 1.1337, "step": 26209 }, { "epoch": 0.79, "learning_rate": 5.584482302300708e-07, "loss": 1.1186, "step": 26210 }, { "epoch": 0.79, "learning_rate": 5.582945775314752e-07, "loss": 1.1272, "step": 26211 }, { "epoch": 0.79, "learning_rate": 5.581409433169807e-07, "loss": 1.0214, "step": 26212 }, { "epoch": 0.79, "learning_rate": 5.579873275880485e-07, "loss": 1.1578, "step": 26213 }, { "epoch": 0.79, "learning_rate": 5.578337303461414e-07, "loss": 1.1247, "step": 26214 }, { "epoch": 0.79, "learning_rate": 5.576801515927219e-07, "loss": 1.0699, "step": 26215 }, { "epoch": 0.79, "learning_rate": 5.575265913292527e-07, "loss": 1.0325, "step": 26216 }, { "epoch": 0.79, "learning_rate": 5.573730495571942e-07, "loss": 1.1527, "step": 26217 }, { "epoch": 0.79, "learning_rate": 5.572195262780086e-07, "loss": 1.311, "step": 26218 }, { "epoch": 0.79, "learning_rate": 5.570660214931572e-07, "loss": 1.1538, "step": 26219 }, { "epoch": 0.79, "learning_rate": 5.569125352041019e-07, "loss": 1.0728, "step": 26220 }, { "epoch": 0.79, "learning_rate": 5.567590674123038e-07, "loss": 1.1224, "step": 26221 }, { "epoch": 0.79, "learning_rate": 5.566056181192231e-07, "loss": 1.0236, "step": 26222 }, { "epoch": 0.79, "learning_rate": 5.564521873263207e-07, "loss": 1.1493, "step": 26223 }, { "epoch": 0.79, "learning_rate": 5.562987750350576e-07, "loss": 1.1501, "step": 26224 }, { "epoch": 0.79, "learning_rate": 5.561453812468939e-07, "loss": 1.076, "step": 26225 }, { "epoch": 0.79, "learning_rate": 5.559920059632901e-07, "loss": 1.0897, "step": 26226 }, { "epoch": 0.79, "learning_rate": 5.558386491857068e-07, "loss": 1.0118, "step": 26227 }, { "epoch": 0.79, "learning_rate": 5.556853109156024e-07, "loss": 1.1233, "step": 26228 }, { "epoch": 0.79, "learning_rate": 5.555319911544376e-07, "loss": 1.073, "step": 26229 }, { "epoch": 0.79, "learning_rate": 5.553786899036717e-07, "loss": 1.2617, "step": 26230 }, { "epoch": 0.79, "learning_rate": 5.552254071647642e-07, "loss": 1.2408, "step": 26231 }, { "epoch": 0.79, "learning_rate": 5.55072142939174e-07, "loss": 1.0374, "step": 26232 }, { "epoch": 0.79, "learning_rate": 5.549188972283603e-07, "loss": 1.0569, "step": 26233 }, { "epoch": 0.79, "learning_rate": 5.547656700337828e-07, "loss": 0.9506, "step": 26234 }, { "epoch": 0.79, "learning_rate": 5.546124613568984e-07, "loss": 1.0562, "step": 26235 }, { "epoch": 0.79, "learning_rate": 5.544592711991665e-07, "loss": 1.0486, "step": 26236 }, { "epoch": 0.79, "learning_rate": 5.543060995620452e-07, "loss": 1.0347, "step": 26237 }, { "epoch": 0.79, "learning_rate": 5.541529464469936e-07, "loss": 1.1159, "step": 26238 }, { "epoch": 0.79, "learning_rate": 5.539998118554682e-07, "loss": 1.0347, "step": 26239 }, { "epoch": 0.79, "learning_rate": 5.538466957889271e-07, "loss": 1.057, "step": 26240 }, { "epoch": 0.79, "learning_rate": 5.536935982488284e-07, "loss": 0.9886, "step": 26241 }, { "epoch": 0.79, "learning_rate": 5.535405192366298e-07, "loss": 1.119, "step": 26242 }, { "epoch": 0.79, "learning_rate": 5.533874587537874e-07, "loss": 1.0532, "step": 26243 }, { "epoch": 0.79, "learning_rate": 5.532344168017589e-07, "loss": 1.2326, "step": 26244 }, { "epoch": 0.79, "learning_rate": 5.530813933820012e-07, "loss": 1.0974, "step": 26245 }, { "epoch": 0.79, "learning_rate": 5.529283884959707e-07, "loss": 1.099, "step": 26246 }, { "epoch": 0.79, "learning_rate": 5.527754021451251e-07, "loss": 1.1041, "step": 26247 }, { "epoch": 0.79, "learning_rate": 5.526224343309191e-07, "loss": 1.1095, "step": 26248 }, { "epoch": 0.79, "learning_rate": 5.524694850548096e-07, "loss": 1.0181, "step": 26249 }, { "epoch": 0.79, "learning_rate": 5.523165543182529e-07, "loss": 1.1248, "step": 26250 }, { "epoch": 0.79, "learning_rate": 5.52163642122705e-07, "loss": 1.1158, "step": 26251 }, { "epoch": 0.79, "learning_rate": 5.520107484696205e-07, "loss": 1.1063, "step": 26252 }, { "epoch": 0.79, "learning_rate": 5.518578733604554e-07, "loss": 1.1225, "step": 26253 }, { "epoch": 0.79, "learning_rate": 5.517050167966653e-07, "loss": 0.9852, "step": 26254 }, { "epoch": 0.79, "learning_rate": 5.515521787797048e-07, "loss": 1.1434, "step": 26255 }, { "epoch": 0.79, "learning_rate": 5.513993593110295e-07, "loss": 1.0984, "step": 26256 }, { "epoch": 0.79, "learning_rate": 5.512465583920937e-07, "loss": 1.0445, "step": 26257 }, { "epoch": 0.79, "learning_rate": 5.510937760243521e-07, "loss": 1.0941, "step": 26258 }, { "epoch": 0.79, "learning_rate": 5.50941012209259e-07, "loss": 1.1241, "step": 26259 }, { "epoch": 0.79, "learning_rate": 5.507882669482695e-07, "loss": 1.0413, "step": 26260 }, { "epoch": 0.79, "learning_rate": 5.506355402428362e-07, "loss": 1.0664, "step": 26261 }, { "epoch": 0.79, "learning_rate": 5.504828320944139e-07, "loss": 1.067, "step": 26262 }, { "epoch": 0.79, "learning_rate": 5.50330142504456e-07, "loss": 1.0811, "step": 26263 }, { "epoch": 0.79, "learning_rate": 5.501774714744168e-07, "loss": 1.1682, "step": 26264 }, { "epoch": 0.79, "learning_rate": 5.500248190057483e-07, "loss": 1.0726, "step": 26265 }, { "epoch": 0.79, "learning_rate": 5.498721850999045e-07, "loss": 1.0935, "step": 26266 }, { "epoch": 0.79, "learning_rate": 5.497195697583383e-07, "loss": 1.1347, "step": 26267 }, { "epoch": 0.79, "learning_rate": 5.495669729825032e-07, "loss": 1.1324, "step": 26268 }, { "epoch": 0.79, "learning_rate": 5.494143947738504e-07, "loss": 1.0867, "step": 26269 }, { "epoch": 0.79, "learning_rate": 5.49261835133833e-07, "loss": 1.1094, "step": 26270 }, { "epoch": 0.79, "learning_rate": 5.491092940639037e-07, "loss": 1.0449, "step": 26271 }, { "epoch": 0.79, "learning_rate": 5.489567715655142e-07, "loss": 1.0198, "step": 26272 }, { "epoch": 0.79, "learning_rate": 5.48804267640117e-07, "loss": 1.1438, "step": 26273 }, { "epoch": 0.79, "learning_rate": 5.486517822891632e-07, "loss": 1.1507, "step": 26274 }, { "epoch": 0.79, "learning_rate": 5.484993155141044e-07, "loss": 0.9999, "step": 26275 }, { "epoch": 0.79, "learning_rate": 5.483468673163922e-07, "loss": 1.076, "step": 26276 }, { "epoch": 0.79, "learning_rate": 5.481944376974787e-07, "loss": 1.2587, "step": 26277 }, { "epoch": 0.79, "learning_rate": 5.480420266588135e-07, "loss": 1.0526, "step": 26278 }, { "epoch": 0.79, "learning_rate": 5.478896342018478e-07, "loss": 1.1592, "step": 26279 }, { "epoch": 0.79, "learning_rate": 5.477372603280329e-07, "loss": 1.1308, "step": 26280 }, { "epoch": 0.79, "learning_rate": 5.47584905038819e-07, "loss": 1.0997, "step": 26281 }, { "epoch": 0.79, "learning_rate": 5.474325683356563e-07, "loss": 1.0466, "step": 26282 }, { "epoch": 0.79, "learning_rate": 5.472802502199953e-07, "loss": 1.1276, "step": 26283 }, { "epoch": 0.79, "learning_rate": 5.471279506932859e-07, "loss": 1.0934, "step": 26284 }, { "epoch": 0.79, "learning_rate": 5.469756697569778e-07, "loss": 1.0628, "step": 26285 }, { "epoch": 0.79, "learning_rate": 5.468234074125214e-07, "loss": 1.0786, "step": 26286 }, { "epoch": 0.79, "learning_rate": 5.46671163661365e-07, "loss": 1.1591, "step": 26287 }, { "epoch": 0.79, "learning_rate": 5.465189385049582e-07, "loss": 1.059, "step": 26288 }, { "epoch": 0.79, "learning_rate": 5.463667319447503e-07, "loss": 1.0919, "step": 26289 }, { "epoch": 0.79, "learning_rate": 5.462145439821909e-07, "loss": 1.1288, "step": 26290 }, { "epoch": 0.79, "learning_rate": 5.460623746187271e-07, "loss": 1.0714, "step": 26291 }, { "epoch": 0.79, "learning_rate": 5.459102238558089e-07, "loss": 1.0832, "step": 26292 }, { "epoch": 0.79, "learning_rate": 5.457580916948841e-07, "loss": 1.2238, "step": 26293 }, { "epoch": 0.79, "learning_rate": 5.456059781374016e-07, "loss": 1.1151, "step": 26294 }, { "epoch": 0.79, "learning_rate": 5.454538831848083e-07, "loss": 1.1715, "step": 26295 }, { "epoch": 0.79, "learning_rate": 5.453018068385526e-07, "loss": 1.1923, "step": 26296 }, { "epoch": 0.79, "learning_rate": 5.451497491000826e-07, "loss": 1.0456, "step": 26297 }, { "epoch": 0.79, "learning_rate": 5.449977099708459e-07, "loss": 1.183, "step": 26298 }, { "epoch": 0.79, "learning_rate": 5.448456894522888e-07, "loss": 0.9645, "step": 26299 }, { "epoch": 0.79, "learning_rate": 5.446936875458592e-07, "loss": 1.0872, "step": 26300 }, { "epoch": 0.79, "learning_rate": 5.445417042530041e-07, "loss": 1.123, "step": 26301 }, { "epoch": 0.79, "learning_rate": 5.443897395751699e-07, "loss": 1.1412, "step": 26302 }, { "epoch": 0.79, "learning_rate": 5.442377935138044e-07, "loss": 1.063, "step": 26303 }, { "epoch": 0.79, "learning_rate": 5.440858660703524e-07, "loss": 1.0454, "step": 26304 }, { "epoch": 0.79, "learning_rate": 5.43933957246261e-07, "loss": 1.0517, "step": 26305 }, { "epoch": 0.79, "learning_rate": 5.437820670429761e-07, "loss": 1.2324, "step": 26306 }, { "epoch": 0.79, "learning_rate": 5.436301954619438e-07, "loss": 1.1418, "step": 26307 }, { "epoch": 0.79, "learning_rate": 5.4347834250461e-07, "loss": 1.0497, "step": 26308 }, { "epoch": 0.79, "learning_rate": 5.433265081724209e-07, "loss": 1.0864, "step": 26309 }, { "epoch": 0.79, "learning_rate": 5.431746924668202e-07, "loss": 1.1268, "step": 26310 }, { "epoch": 0.79, "learning_rate": 5.430228953892539e-07, "loss": 1.1505, "step": 26311 }, { "epoch": 0.79, "learning_rate": 5.428711169411671e-07, "loss": 1.0836, "step": 26312 }, { "epoch": 0.79, "learning_rate": 5.42719357124005e-07, "loss": 1.1451, "step": 26313 }, { "epoch": 0.79, "learning_rate": 5.425676159392116e-07, "loss": 1.158, "step": 26314 }, { "epoch": 0.79, "learning_rate": 5.42415893388232e-07, "loss": 1.0579, "step": 26315 }, { "epoch": 0.79, "learning_rate": 5.422641894725109e-07, "loss": 1.1528, "step": 26316 }, { "epoch": 0.79, "learning_rate": 5.42112504193491e-07, "loss": 1.1533, "step": 26317 }, { "epoch": 0.79, "learning_rate": 5.419608375526172e-07, "loss": 1.1246, "step": 26318 }, { "epoch": 0.79, "learning_rate": 5.418091895513334e-07, "loss": 1.1003, "step": 26319 }, { "epoch": 0.79, "learning_rate": 5.416575601910837e-07, "loss": 1.1191, "step": 26320 }, { "epoch": 0.79, "learning_rate": 5.415059494733099e-07, "loss": 1.0104, "step": 26321 }, { "epoch": 0.79, "learning_rate": 5.413543573994564e-07, "loss": 1.132, "step": 26322 }, { "epoch": 0.79, "learning_rate": 5.412027839709661e-07, "loss": 1.0577, "step": 26323 }, { "epoch": 0.79, "learning_rate": 5.410512291892825e-07, "loss": 1.0344, "step": 26324 }, { "epoch": 0.79, "learning_rate": 5.408996930558469e-07, "loss": 1.1421, "step": 26325 }, { "epoch": 0.79, "learning_rate": 5.407481755721031e-07, "loss": 1.0636, "step": 26326 }, { "epoch": 0.79, "learning_rate": 5.405966767394927e-07, "loss": 1.142, "step": 26327 }, { "epoch": 0.79, "learning_rate": 5.404451965594585e-07, "loss": 1.058, "step": 26328 }, { "epoch": 0.79, "learning_rate": 5.402937350334427e-07, "loss": 1.0614, "step": 26329 }, { "epoch": 0.79, "learning_rate": 5.401422921628863e-07, "loss": 1.128, "step": 26330 }, { "epoch": 0.79, "learning_rate": 5.399908679492313e-07, "loss": 1.1846, "step": 26331 }, { "epoch": 0.79, "learning_rate": 5.39839462393919e-07, "loss": 1.1201, "step": 26332 }, { "epoch": 0.79, "learning_rate": 5.396880754983921e-07, "loss": 1.0847, "step": 26333 }, { "epoch": 0.79, "learning_rate": 5.395367072640898e-07, "loss": 1.1094, "step": 26334 }, { "epoch": 0.79, "learning_rate": 5.393853576924535e-07, "loss": 1.1905, "step": 26335 }, { "epoch": 0.79, "learning_rate": 5.392340267849247e-07, "loss": 1.1326, "step": 26336 }, { "epoch": 0.79, "learning_rate": 5.390827145429436e-07, "loss": 1.0775, "step": 26337 }, { "epoch": 0.79, "learning_rate": 5.389314209679505e-07, "loss": 1.2273, "step": 26338 }, { "epoch": 0.79, "learning_rate": 5.387801460613859e-07, "loss": 1.0679, "step": 26339 }, { "epoch": 0.79, "learning_rate": 5.386288898246897e-07, "loss": 1.1761, "step": 26340 }, { "epoch": 0.79, "learning_rate": 5.384776522593019e-07, "loss": 1.019, "step": 26341 }, { "epoch": 0.79, "learning_rate": 5.383264333666627e-07, "loss": 1.1043, "step": 26342 }, { "epoch": 0.79, "learning_rate": 5.381752331482104e-07, "loss": 1.0598, "step": 26343 }, { "epoch": 0.79, "learning_rate": 5.380240516053853e-07, "loss": 1.0053, "step": 26344 }, { "epoch": 0.79, "learning_rate": 5.378728887396259e-07, "loss": 1.1342, "step": 26345 }, { "epoch": 0.79, "learning_rate": 5.377217445523725e-07, "loss": 1.0276, "step": 26346 }, { "epoch": 0.79, "learning_rate": 5.375706190450625e-07, "loss": 1.1155, "step": 26347 }, { "epoch": 0.79, "learning_rate": 5.374195122191347e-07, "loss": 1.0553, "step": 26348 }, { "epoch": 0.79, "learning_rate": 5.372684240760285e-07, "loss": 1.2493, "step": 26349 }, { "epoch": 0.79, "learning_rate": 5.371173546171817e-07, "loss": 1.1731, "step": 26350 }, { "epoch": 0.79, "learning_rate": 5.369663038440321e-07, "loss": 1.0629, "step": 26351 }, { "epoch": 0.79, "learning_rate": 5.368152717580174e-07, "loss": 1.2584, "step": 26352 }, { "epoch": 0.79, "learning_rate": 5.366642583605763e-07, "loss": 1.0189, "step": 26353 }, { "epoch": 0.79, "learning_rate": 5.365132636531456e-07, "loss": 1.2773, "step": 26354 }, { "epoch": 0.79, "learning_rate": 5.363622876371638e-07, "loss": 1.075, "step": 26355 }, { "epoch": 0.79, "learning_rate": 5.362113303140664e-07, "loss": 0.9967, "step": 26356 }, { "epoch": 0.79, "learning_rate": 5.360603916852916e-07, "loss": 1.0202, "step": 26357 }, { "epoch": 0.79, "learning_rate": 5.359094717522759e-07, "loss": 1.0887, "step": 26358 }, { "epoch": 0.79, "learning_rate": 5.357585705164567e-07, "loss": 1.0095, "step": 26359 }, { "epoch": 0.79, "learning_rate": 5.356076879792693e-07, "loss": 1.1438, "step": 26360 }, { "epoch": 0.79, "learning_rate": 5.354568241421504e-07, "loss": 1.144, "step": 26361 }, { "epoch": 0.79, "learning_rate": 5.353059790065368e-07, "loss": 1.0241, "step": 26362 }, { "epoch": 0.79, "learning_rate": 5.351551525738638e-07, "loss": 1.053, "step": 26363 }, { "epoch": 0.79, "learning_rate": 5.350043448455674e-07, "loss": 1.1162, "step": 26364 }, { "epoch": 0.79, "learning_rate": 5.348535558230833e-07, "loss": 1.1075, "step": 26365 }, { "epoch": 0.79, "learning_rate": 5.347027855078471e-07, "loss": 1.1873, "step": 26366 }, { "epoch": 0.79, "learning_rate": 5.345520339012936e-07, "loss": 1.1246, "step": 26367 }, { "epoch": 0.79, "learning_rate": 5.344013010048588e-07, "loss": 1.1957, "step": 26368 }, { "epoch": 0.79, "learning_rate": 5.342505868199765e-07, "loss": 1.2139, "step": 26369 }, { "epoch": 0.79, "learning_rate": 5.340998913480819e-07, "loss": 1.095, "step": 26370 }, { "epoch": 0.79, "learning_rate": 5.339492145906092e-07, "loss": 1.0399, "step": 26371 }, { "epoch": 0.79, "learning_rate": 5.33798556548994e-07, "loss": 1.1459, "step": 26372 }, { "epoch": 0.79, "learning_rate": 5.33647917224669e-07, "loss": 1.2216, "step": 26373 }, { "epoch": 0.79, "learning_rate": 5.334972966190685e-07, "loss": 1.2341, "step": 26374 }, { "epoch": 0.79, "learning_rate": 5.333466947336269e-07, "loss": 1.0153, "step": 26375 }, { "epoch": 0.79, "learning_rate": 5.331961115697781e-07, "loss": 0.9824, "step": 26376 }, { "epoch": 0.79, "learning_rate": 5.330455471289545e-07, "loss": 1.1543, "step": 26377 }, { "epoch": 0.79, "learning_rate": 5.328950014125899e-07, "loss": 1.0616, "step": 26378 }, { "epoch": 0.79, "learning_rate": 5.327444744221178e-07, "loss": 1.1725, "step": 26379 }, { "epoch": 0.79, "learning_rate": 5.325939661589704e-07, "loss": 1.2048, "step": 26380 }, { "epoch": 0.79, "learning_rate": 5.324434766245817e-07, "loss": 1.2656, "step": 26381 }, { "epoch": 0.79, "learning_rate": 5.322930058203829e-07, "loss": 1.073, "step": 26382 }, { "epoch": 0.79, "learning_rate": 5.32142553747807e-07, "loss": 1.0491, "step": 26383 }, { "epoch": 0.79, "learning_rate": 5.319921204082865e-07, "loss": 1.0196, "step": 26384 }, { "epoch": 0.79, "learning_rate": 5.318417058032535e-07, "loss": 1.0792, "step": 26385 }, { "epoch": 0.79, "learning_rate": 5.316913099341389e-07, "loss": 1.1011, "step": 26386 }, { "epoch": 0.79, "learning_rate": 5.315409328023752e-07, "loss": 1.1673, "step": 26387 }, { "epoch": 0.79, "learning_rate": 5.313905744093936e-07, "loss": 1.1415, "step": 26388 }, { "epoch": 0.79, "learning_rate": 5.312402347566259e-07, "loss": 1.1246, "step": 26389 }, { "epoch": 0.79, "learning_rate": 5.310899138455028e-07, "loss": 1.1038, "step": 26390 }, { "epoch": 0.8, "learning_rate": 5.309396116774562e-07, "loss": 1.1155, "step": 26391 }, { "epoch": 0.8, "learning_rate": 5.307893282539153e-07, "loss": 1.2275, "step": 26392 }, { "epoch": 0.8, "learning_rate": 5.306390635763118e-07, "loss": 1.2374, "step": 26393 }, { "epoch": 0.8, "learning_rate": 5.30488817646076e-07, "loss": 1.1155, "step": 26394 }, { "epoch": 0.8, "learning_rate": 5.303385904646377e-07, "loss": 0.9977, "step": 26395 }, { "epoch": 0.8, "learning_rate": 5.301883820334278e-07, "loss": 1.1349, "step": 26396 }, { "epoch": 0.8, "learning_rate": 5.300381923538755e-07, "loss": 1.0352, "step": 26397 }, { "epoch": 0.8, "learning_rate": 5.298880214274118e-07, "loss": 1.0829, "step": 26398 }, { "epoch": 0.8, "learning_rate": 5.297378692554647e-07, "loss": 1.2068, "step": 26399 }, { "epoch": 0.8, "learning_rate": 5.295877358394638e-07, "loss": 1.0445, "step": 26400 }, { "epoch": 0.8, "learning_rate": 5.294376211808388e-07, "loss": 1.0908, "step": 26401 }, { "epoch": 0.8, "learning_rate": 5.292875252810195e-07, "loss": 1.0714, "step": 26402 }, { "epoch": 0.8, "learning_rate": 5.29137448141433e-07, "loss": 0.9523, "step": 26403 }, { "epoch": 0.8, "learning_rate": 5.289873897635086e-07, "loss": 1.1414, "step": 26404 }, { "epoch": 0.8, "learning_rate": 5.288373501486754e-07, "loss": 1.1476, "step": 26405 }, { "epoch": 0.8, "learning_rate": 5.28687329298361e-07, "loss": 1.1286, "step": 26406 }, { "epoch": 0.8, "learning_rate": 5.285373272139946e-07, "loss": 1.1348, "step": 26407 }, { "epoch": 0.8, "learning_rate": 5.283873438970024e-07, "loss": 1.1277, "step": 26408 }, { "epoch": 0.8, "learning_rate": 5.282373793488135e-07, "loss": 1.1381, "step": 26409 }, { "epoch": 0.8, "learning_rate": 5.280874335708549e-07, "loss": 1.101, "step": 26410 }, { "epoch": 0.8, "learning_rate": 5.27937506564555e-07, "loss": 1.2411, "step": 26411 }, { "epoch": 0.8, "learning_rate": 5.277875983313397e-07, "loss": 1.1623, "step": 26412 }, { "epoch": 0.8, "learning_rate": 5.276377088726361e-07, "loss": 1.0715, "step": 26413 }, { "epoch": 0.8, "learning_rate": 5.274878381898721e-07, "loss": 0.9903, "step": 26414 }, { "epoch": 0.8, "learning_rate": 5.273379862844744e-07, "loss": 1.1605, "step": 26415 }, { "epoch": 0.8, "learning_rate": 5.271881531578682e-07, "loss": 0.9769, "step": 26416 }, { "epoch": 0.8, "learning_rate": 5.270383388114808e-07, "loss": 1.1737, "step": 26417 }, { "epoch": 0.8, "learning_rate": 5.268885432467383e-07, "loss": 1.0851, "step": 26418 }, { "epoch": 0.8, "learning_rate": 5.267387664650664e-07, "loss": 1.0342, "step": 26419 }, { "epoch": 0.8, "learning_rate": 5.265890084678913e-07, "loss": 1.1188, "step": 26420 }, { "epoch": 0.8, "learning_rate": 5.264392692566381e-07, "loss": 1.1259, "step": 26421 }, { "epoch": 0.8, "learning_rate": 5.262895488327327e-07, "loss": 1.0898, "step": 26422 }, { "epoch": 0.8, "learning_rate": 5.261398471976003e-07, "loss": 1.1078, "step": 26423 }, { "epoch": 0.8, "learning_rate": 5.259901643526666e-07, "loss": 1.2524, "step": 26424 }, { "epoch": 0.8, "learning_rate": 5.25840500299355e-07, "loss": 1.0533, "step": 26425 }, { "epoch": 0.8, "learning_rate": 5.25690855039091e-07, "loss": 1.1774, "step": 26426 }, { "epoch": 0.8, "learning_rate": 5.255412285732995e-07, "loss": 1.1307, "step": 26427 }, { "epoch": 0.8, "learning_rate": 5.253916209034049e-07, "loss": 1.026, "step": 26428 }, { "epoch": 0.8, "learning_rate": 5.252420320308307e-07, "loss": 1.041, "step": 26429 }, { "epoch": 0.8, "learning_rate": 5.25092461957001e-07, "loss": 1.0313, "step": 26430 }, { "epoch": 0.8, "learning_rate": 5.249429106833401e-07, "loss": 1.0322, "step": 26431 }, { "epoch": 0.8, "learning_rate": 5.247933782112716e-07, "loss": 1.1243, "step": 26432 }, { "epoch": 0.8, "learning_rate": 5.246438645422191e-07, "loss": 1.1309, "step": 26433 }, { "epoch": 0.8, "learning_rate": 5.244943696776053e-07, "loss": 1.0612, "step": 26434 }, { "epoch": 0.8, "learning_rate": 5.243448936188536e-07, "loss": 0.9391, "step": 26435 }, { "epoch": 0.8, "learning_rate": 5.24195436367387e-07, "loss": 1.1807, "step": 26436 }, { "epoch": 0.8, "learning_rate": 5.24045997924629e-07, "loss": 1.1188, "step": 26437 }, { "epoch": 0.8, "learning_rate": 5.238965782920005e-07, "loss": 1.0748, "step": 26438 }, { "epoch": 0.8, "learning_rate": 5.237471774709252e-07, "loss": 1.1996, "step": 26439 }, { "epoch": 0.8, "learning_rate": 5.235977954628249e-07, "loss": 1.0681, "step": 26440 }, { "epoch": 0.8, "learning_rate": 5.234484322691221e-07, "loss": 1.1228, "step": 26441 }, { "epoch": 0.8, "learning_rate": 5.232990878912381e-07, "loss": 1.0036, "step": 26442 }, { "epoch": 0.8, "learning_rate": 5.231497623305942e-07, "loss": 1.2256, "step": 26443 }, { "epoch": 0.8, "learning_rate": 5.230004555886128e-07, "loss": 1.0963, "step": 26444 }, { "epoch": 0.8, "learning_rate": 5.22851167666715e-07, "loss": 1.05, "step": 26445 }, { "epoch": 0.8, "learning_rate": 5.227018985663218e-07, "loss": 1.0901, "step": 26446 }, { "epoch": 0.8, "learning_rate": 5.225526482888541e-07, "loss": 1.0321, "step": 26447 }, { "epoch": 0.8, "learning_rate": 5.224034168357329e-07, "loss": 1.0811, "step": 26448 }, { "epoch": 0.8, "learning_rate": 5.222542042083786e-07, "loss": 0.9818, "step": 26449 }, { "epoch": 0.8, "learning_rate": 5.221050104082126e-07, "loss": 1.086, "step": 26450 }, { "epoch": 0.8, "learning_rate": 5.219558354366536e-07, "loss": 1.1136, "step": 26451 }, { "epoch": 0.8, "learning_rate": 5.218066792951224e-07, "loss": 1.0304, "step": 26452 }, { "epoch": 0.8, "learning_rate": 5.216575419850389e-07, "loss": 1.1576, "step": 26453 }, { "epoch": 0.8, "learning_rate": 5.215084235078233e-07, "loss": 1.1412, "step": 26454 }, { "epoch": 0.8, "learning_rate": 5.213593238648943e-07, "loss": 1.0572, "step": 26455 }, { "epoch": 0.8, "learning_rate": 5.212102430576713e-07, "loss": 1.0668, "step": 26456 }, { "epoch": 0.8, "learning_rate": 5.210611810875738e-07, "loss": 1.155, "step": 26457 }, { "epoch": 0.8, "learning_rate": 5.209121379560208e-07, "loss": 1.0743, "step": 26458 }, { "epoch": 0.8, "learning_rate": 5.207631136644317e-07, "loss": 1.0897, "step": 26459 }, { "epoch": 0.8, "learning_rate": 5.206141082142241e-07, "loss": 1.0643, "step": 26460 }, { "epoch": 0.8, "learning_rate": 5.204651216068166e-07, "loss": 0.9096, "step": 26461 }, { "epoch": 0.8, "learning_rate": 5.203161538436279e-07, "loss": 1.0261, "step": 26462 }, { "epoch": 0.8, "learning_rate": 5.201672049260767e-07, "loss": 0.9612, "step": 26463 }, { "epoch": 0.8, "learning_rate": 5.200182748555793e-07, "loss": 1.0782, "step": 26464 }, { "epoch": 0.8, "learning_rate": 5.198693636335544e-07, "loss": 1.0778, "step": 26465 }, { "epoch": 0.8, "learning_rate": 5.197204712614196e-07, "loss": 0.9937, "step": 26466 }, { "epoch": 0.8, "learning_rate": 5.195715977405929e-07, "loss": 1.1365, "step": 26467 }, { "epoch": 0.8, "learning_rate": 5.194227430724899e-07, "loss": 1.1455, "step": 26468 }, { "epoch": 0.8, "learning_rate": 5.192739072585287e-07, "loss": 1.2615, "step": 26469 }, { "epoch": 0.8, "learning_rate": 5.191250903001258e-07, "loss": 1.1892, "step": 26470 }, { "epoch": 0.8, "learning_rate": 5.189762921986983e-07, "loss": 1.0469, "step": 26471 }, { "epoch": 0.8, "learning_rate": 5.188275129556622e-07, "loss": 1.1715, "step": 26472 }, { "epoch": 0.8, "learning_rate": 5.186787525724338e-07, "loss": 1.1873, "step": 26473 }, { "epoch": 0.8, "learning_rate": 5.185300110504304e-07, "loss": 0.933, "step": 26474 }, { "epoch": 0.8, "learning_rate": 5.183812883910663e-07, "loss": 1.1335, "step": 26475 }, { "epoch": 0.8, "learning_rate": 5.182325845957578e-07, "loss": 1.0049, "step": 26476 }, { "epoch": 0.8, "learning_rate": 5.180838996659207e-07, "loss": 1.2094, "step": 26477 }, { "epoch": 0.8, "learning_rate": 5.179352336029705e-07, "loss": 1.1592, "step": 26478 }, { "epoch": 0.8, "learning_rate": 5.177865864083221e-07, "loss": 1.1995, "step": 26479 }, { "epoch": 0.8, "learning_rate": 5.176379580833915e-07, "loss": 1.124, "step": 26480 }, { "epoch": 0.8, "learning_rate": 5.174893486295921e-07, "loss": 1.0143, "step": 26481 }, { "epoch": 0.8, "learning_rate": 5.173407580483392e-07, "loss": 1.0646, "step": 26482 }, { "epoch": 0.8, "learning_rate": 5.171921863410476e-07, "loss": 1.1096, "step": 26483 }, { "epoch": 0.8, "learning_rate": 5.17043633509132e-07, "loss": 1.1071, "step": 26484 }, { "epoch": 0.8, "learning_rate": 5.168950995540054e-07, "loss": 1.0851, "step": 26485 }, { "epoch": 0.8, "learning_rate": 5.167465844770822e-07, "loss": 1.0455, "step": 26486 }, { "epoch": 0.8, "learning_rate": 5.165980882797764e-07, "loss": 1.1796, "step": 26487 }, { "epoch": 0.8, "learning_rate": 5.164496109635015e-07, "loss": 1.0919, "step": 26488 }, { "epoch": 0.8, "learning_rate": 5.163011525296718e-07, "loss": 1.0374, "step": 26489 }, { "epoch": 0.8, "learning_rate": 5.16152712979699e-07, "loss": 0.9885, "step": 26490 }, { "epoch": 0.8, "learning_rate": 5.160042923149969e-07, "loss": 1.1141, "step": 26491 }, { "epoch": 0.8, "learning_rate": 5.158558905369784e-07, "loss": 1.1041, "step": 26492 }, { "epoch": 0.8, "learning_rate": 5.15707507647057e-07, "loss": 1.1447, "step": 26493 }, { "epoch": 0.8, "learning_rate": 5.155591436466437e-07, "loss": 1.1255, "step": 26494 }, { "epoch": 0.8, "learning_rate": 5.154107985371517e-07, "loss": 1.1162, "step": 26495 }, { "epoch": 0.8, "learning_rate": 5.152624723199928e-07, "loss": 1.0646, "step": 26496 }, { "epoch": 0.8, "learning_rate": 5.151141649965805e-07, "loss": 1.1342, "step": 26497 }, { "epoch": 0.8, "learning_rate": 5.149658765683244e-07, "loss": 1.2705, "step": 26498 }, { "epoch": 0.8, "learning_rate": 5.14817607036637e-07, "loss": 1.0936, "step": 26499 }, { "epoch": 0.8, "learning_rate": 5.146693564029301e-07, "loss": 1.224, "step": 26500 }, { "epoch": 0.8, "learning_rate": 5.145211246686146e-07, "loss": 1.066, "step": 26501 }, { "epoch": 0.8, "learning_rate": 5.143729118351018e-07, "loss": 1.0957, "step": 26502 }, { "epoch": 0.8, "learning_rate": 5.142247179038027e-07, "loss": 1.1, "step": 26503 }, { "epoch": 0.8, "learning_rate": 5.140765428761277e-07, "loss": 1.0883, "step": 26504 }, { "epoch": 0.8, "learning_rate": 5.139283867534878e-07, "loss": 1.029, "step": 26505 }, { "epoch": 0.8, "learning_rate": 5.137802495372934e-07, "loss": 1.1457, "step": 26506 }, { "epoch": 0.8, "learning_rate": 5.136321312289541e-07, "loss": 1.2058, "step": 26507 }, { "epoch": 0.8, "learning_rate": 5.134840318298803e-07, "loss": 1.0349, "step": 26508 }, { "epoch": 0.8, "learning_rate": 5.133359513414815e-07, "loss": 1.1097, "step": 26509 }, { "epoch": 0.8, "learning_rate": 5.131878897651685e-07, "loss": 1.1035, "step": 26510 }, { "epoch": 0.8, "learning_rate": 5.130398471023492e-07, "loss": 1.0613, "step": 26511 }, { "epoch": 0.8, "learning_rate": 5.128918233544336e-07, "loss": 1.0175, "step": 26512 }, { "epoch": 0.8, "learning_rate": 5.127438185228309e-07, "loss": 1.1235, "step": 26513 }, { "epoch": 0.8, "learning_rate": 5.125958326089498e-07, "loss": 1.0873, "step": 26514 }, { "epoch": 0.8, "learning_rate": 5.124478656141998e-07, "loss": 1.0804, "step": 26515 }, { "epoch": 0.8, "learning_rate": 5.122999175399884e-07, "loss": 1.0408, "step": 26516 }, { "epoch": 0.8, "learning_rate": 5.121519883877243e-07, "loss": 1.1288, "step": 26517 }, { "epoch": 0.8, "learning_rate": 5.120040781588162e-07, "loss": 1.1123, "step": 26518 }, { "epoch": 0.8, "learning_rate": 5.118561868546724e-07, "loss": 1.125, "step": 26519 }, { "epoch": 0.8, "learning_rate": 5.117083144766993e-07, "loss": 1.1632, "step": 26520 }, { "epoch": 0.8, "learning_rate": 5.115604610263056e-07, "loss": 1.0914, "step": 26521 }, { "epoch": 0.8, "learning_rate": 5.114126265048985e-07, "loss": 1.0988, "step": 26522 }, { "epoch": 0.8, "learning_rate": 5.112648109138862e-07, "loss": 0.9608, "step": 26523 }, { "epoch": 0.8, "learning_rate": 5.111170142546745e-07, "loss": 1.2146, "step": 26524 }, { "epoch": 0.8, "learning_rate": 5.109692365286709e-07, "loss": 1.0374, "step": 26525 }, { "epoch": 0.8, "learning_rate": 5.108214777372822e-07, "loss": 1.1069, "step": 26526 }, { "epoch": 0.8, "learning_rate": 5.106737378819152e-07, "loss": 1.1495, "step": 26527 }, { "epoch": 0.8, "learning_rate": 5.105260169639759e-07, "loss": 1.0236, "step": 26528 }, { "epoch": 0.8, "learning_rate": 5.103783149848706e-07, "loss": 1.0825, "step": 26529 }, { "epoch": 0.8, "learning_rate": 5.102306319460059e-07, "loss": 1.0878, "step": 26530 }, { "epoch": 0.8, "learning_rate": 5.10082967848787e-07, "loss": 1.2156, "step": 26531 }, { "epoch": 0.8, "learning_rate": 5.099353226946208e-07, "loss": 1.1407, "step": 26532 }, { "epoch": 0.8, "learning_rate": 5.09787696484911e-07, "loss": 1.1236, "step": 26533 }, { "epoch": 0.8, "learning_rate": 5.096400892210637e-07, "loss": 0.9695, "step": 26534 }, { "epoch": 0.8, "learning_rate": 5.094925009044843e-07, "loss": 1.0109, "step": 26535 }, { "epoch": 0.8, "learning_rate": 5.093449315365784e-07, "loss": 1.2082, "step": 26536 }, { "epoch": 0.8, "learning_rate": 5.091973811187492e-07, "loss": 1.2191, "step": 26537 }, { "epoch": 0.8, "learning_rate": 5.090498496524024e-07, "loss": 0.9481, "step": 26538 }, { "epoch": 0.8, "learning_rate": 5.089023371389418e-07, "loss": 1.102, "step": 26539 }, { "epoch": 0.8, "learning_rate": 5.087548435797723e-07, "loss": 1.0886, "step": 26540 }, { "epoch": 0.8, "learning_rate": 5.086073689762983e-07, "loss": 1.0286, "step": 26541 }, { "epoch": 0.8, "learning_rate": 5.084599133299222e-07, "loss": 1.076, "step": 26542 }, { "epoch": 0.8, "learning_rate": 5.083124766420486e-07, "loss": 1.0686, "step": 26543 }, { "epoch": 0.8, "learning_rate": 5.081650589140811e-07, "loss": 1.1048, "step": 26544 }, { "epoch": 0.8, "learning_rate": 5.080176601474235e-07, "loss": 1.2372, "step": 26545 }, { "epoch": 0.8, "learning_rate": 5.078702803434779e-07, "loss": 1.1254, "step": 26546 }, { "epoch": 0.8, "learning_rate": 5.077229195036476e-07, "loss": 1.1266, "step": 26547 }, { "epoch": 0.8, "learning_rate": 5.075755776293356e-07, "loss": 1.1453, "step": 26548 }, { "epoch": 0.8, "learning_rate": 5.074282547219452e-07, "loss": 1.0429, "step": 26549 }, { "epoch": 0.8, "learning_rate": 5.072809507828778e-07, "loss": 1.0894, "step": 26550 }, { "epoch": 0.8, "learning_rate": 5.071336658135357e-07, "loss": 1.1555, "step": 26551 }, { "epoch": 0.8, "learning_rate": 5.069863998153213e-07, "loss": 1.0958, "step": 26552 }, { "epoch": 0.8, "learning_rate": 5.068391527896366e-07, "loss": 1.0743, "step": 26553 }, { "epoch": 0.8, "learning_rate": 5.066919247378832e-07, "loss": 1.2765, "step": 26554 }, { "epoch": 0.8, "learning_rate": 5.065447156614628e-07, "loss": 1.0628, "step": 26555 }, { "epoch": 0.8, "learning_rate": 5.06397525561777e-07, "loss": 1.0798, "step": 26556 }, { "epoch": 0.8, "learning_rate": 5.062503544402261e-07, "loss": 1.1554, "step": 26557 }, { "epoch": 0.8, "learning_rate": 5.061032022982115e-07, "loss": 1.0253, "step": 26558 }, { "epoch": 0.8, "learning_rate": 5.059560691371343e-07, "loss": 1.0947, "step": 26559 }, { "epoch": 0.8, "learning_rate": 5.05808954958395e-07, "loss": 1.2061, "step": 26560 }, { "epoch": 0.8, "learning_rate": 5.056618597633939e-07, "loss": 1.0081, "step": 26561 }, { "epoch": 0.8, "learning_rate": 5.05514783553532e-07, "loss": 1.1285, "step": 26562 }, { "epoch": 0.8, "learning_rate": 5.053677263302082e-07, "loss": 1.1461, "step": 26563 }, { "epoch": 0.8, "learning_rate": 5.052206880948229e-07, "loss": 1.0767, "step": 26564 }, { "epoch": 0.8, "learning_rate": 5.050736688487762e-07, "loss": 1.0685, "step": 26565 }, { "epoch": 0.8, "learning_rate": 5.04926668593467e-07, "loss": 1.1021, "step": 26566 }, { "epoch": 0.8, "learning_rate": 5.04779687330296e-07, "loss": 1.1604, "step": 26567 }, { "epoch": 0.8, "learning_rate": 5.046327250606606e-07, "loss": 1.1337, "step": 26568 }, { "epoch": 0.8, "learning_rate": 5.044857817859608e-07, "loss": 0.996, "step": 26569 }, { "epoch": 0.8, "learning_rate": 5.043388575075953e-07, "loss": 1.0599, "step": 26570 }, { "epoch": 0.8, "learning_rate": 5.041919522269631e-07, "loss": 1.0679, "step": 26571 }, { "epoch": 0.8, "learning_rate": 5.04045065945462e-07, "loss": 1.0239, "step": 26572 }, { "epoch": 0.8, "learning_rate": 5.038981986644903e-07, "loss": 1.1609, "step": 26573 }, { "epoch": 0.8, "learning_rate": 5.037513503854465e-07, "loss": 1.1208, "step": 26574 }, { "epoch": 0.8, "learning_rate": 5.036045211097293e-07, "loss": 1.1061, "step": 26575 }, { "epoch": 0.8, "learning_rate": 5.034577108387348e-07, "loss": 1.1243, "step": 26576 }, { "epoch": 0.8, "learning_rate": 5.033109195738611e-07, "loss": 1.1032, "step": 26577 }, { "epoch": 0.8, "learning_rate": 5.031641473165061e-07, "loss": 1.0242, "step": 26578 }, { "epoch": 0.8, "learning_rate": 5.030173940680666e-07, "loss": 1.1288, "step": 26579 }, { "epoch": 0.8, "learning_rate": 5.028706598299402e-07, "loss": 1.0972, "step": 26580 }, { "epoch": 0.8, "learning_rate": 5.027239446035228e-07, "loss": 1.1516, "step": 26581 }, { "epoch": 0.8, "learning_rate": 5.025772483902114e-07, "loss": 1.0814, "step": 26582 }, { "epoch": 0.8, "learning_rate": 5.024305711914026e-07, "loss": 1.1888, "step": 26583 }, { "epoch": 0.8, "learning_rate": 5.02283913008493e-07, "loss": 1.1403, "step": 26584 }, { "epoch": 0.8, "learning_rate": 5.021372738428782e-07, "loss": 1.1315, "step": 26585 }, { "epoch": 0.8, "learning_rate": 5.019906536959542e-07, "loss": 1.1039, "step": 26586 }, { "epoch": 0.8, "learning_rate": 5.01844052569117e-07, "loss": 1.0626, "step": 26587 }, { "epoch": 0.8, "learning_rate": 5.016974704637629e-07, "loss": 1.0563, "step": 26588 }, { "epoch": 0.8, "learning_rate": 5.015509073812857e-07, "loss": 1.0476, "step": 26589 }, { "epoch": 0.8, "learning_rate": 5.014043633230814e-07, "loss": 1.0573, "step": 26590 }, { "epoch": 0.8, "learning_rate": 5.01257838290545e-07, "loss": 1.0923, "step": 26591 }, { "epoch": 0.8, "learning_rate": 5.011113322850714e-07, "loss": 1.1656, "step": 26592 }, { "epoch": 0.8, "learning_rate": 5.009648453080556e-07, "loss": 1.118, "step": 26593 }, { "epoch": 0.8, "learning_rate": 5.008183773608913e-07, "loss": 1.1957, "step": 26594 }, { "epoch": 0.8, "learning_rate": 5.006719284449732e-07, "loss": 0.9793, "step": 26595 }, { "epoch": 0.8, "learning_rate": 5.005254985616953e-07, "loss": 1.083, "step": 26596 }, { "epoch": 0.8, "learning_rate": 5.003790877124526e-07, "loss": 1.0811, "step": 26597 }, { "epoch": 0.8, "learning_rate": 5.00232695898637e-07, "loss": 1.0984, "step": 26598 }, { "epoch": 0.8, "learning_rate": 5.000863231216433e-07, "loss": 1.2212, "step": 26599 }, { "epoch": 0.8, "learning_rate": 4.999399693828641e-07, "loss": 1.1971, "step": 26600 }, { "epoch": 0.8, "learning_rate": 4.997936346836943e-07, "loss": 1.0867, "step": 26601 }, { "epoch": 0.8, "learning_rate": 4.99647319025525e-07, "loss": 1.0501, "step": 26602 }, { "epoch": 0.8, "learning_rate": 4.995010224097496e-07, "loss": 1.0167, "step": 26603 }, { "epoch": 0.8, "learning_rate": 4.993547448377611e-07, "loss": 1.0903, "step": 26604 }, { "epoch": 0.8, "learning_rate": 4.992084863109519e-07, "loss": 0.9753, "step": 26605 }, { "epoch": 0.8, "learning_rate": 4.990622468307149e-07, "loss": 1.0917, "step": 26606 }, { "epoch": 0.8, "learning_rate": 4.98916026398441e-07, "loss": 1.0113, "step": 26607 }, { "epoch": 0.8, "learning_rate": 4.98769825015523e-07, "loss": 1.0452, "step": 26608 }, { "epoch": 0.8, "learning_rate": 4.986236426833521e-07, "loss": 1.0274, "step": 26609 }, { "epoch": 0.8, "learning_rate": 4.984774794033207e-07, "loss": 1.0813, "step": 26610 }, { "epoch": 0.8, "learning_rate": 4.983313351768193e-07, "loss": 1.1136, "step": 26611 }, { "epoch": 0.8, "learning_rate": 4.981852100052395e-07, "loss": 1.08, "step": 26612 }, { "epoch": 0.8, "learning_rate": 4.980391038899727e-07, "loss": 1.2363, "step": 26613 }, { "epoch": 0.8, "learning_rate": 4.9789301683241e-07, "loss": 1.0733, "step": 26614 }, { "epoch": 0.8, "learning_rate": 4.977469488339406e-07, "loss": 1.0422, "step": 26615 }, { "epoch": 0.8, "learning_rate": 4.976008998959564e-07, "loss": 1.0977, "step": 26616 }, { "epoch": 0.8, "learning_rate": 4.97454870019847e-07, "loss": 1.0081, "step": 26617 }, { "epoch": 0.8, "learning_rate": 4.973088592070027e-07, "loss": 1.0223, "step": 26618 }, { "epoch": 0.8, "learning_rate": 4.971628674588144e-07, "loss": 1.1136, "step": 26619 }, { "epoch": 0.8, "learning_rate": 4.970168947766702e-07, "loss": 1.042, "step": 26620 }, { "epoch": 0.8, "learning_rate": 4.968709411619604e-07, "loss": 1.2106, "step": 26621 }, { "epoch": 0.8, "learning_rate": 4.967250066160747e-07, "loss": 1.1032, "step": 26622 }, { "epoch": 0.8, "learning_rate": 4.965790911404025e-07, "loss": 1.0847, "step": 26623 }, { "epoch": 0.8, "learning_rate": 4.964331947363321e-07, "loss": 1.1041, "step": 26624 }, { "epoch": 0.8, "learning_rate": 4.962873174052526e-07, "loss": 1.194, "step": 26625 }, { "epoch": 0.8, "learning_rate": 4.96141459148553e-07, "loss": 1.0407, "step": 26626 }, { "epoch": 0.8, "learning_rate": 4.959956199676222e-07, "loss": 1.204, "step": 26627 }, { "epoch": 0.8, "learning_rate": 4.958497998638473e-07, "loss": 1.053, "step": 26628 }, { "epoch": 0.8, "learning_rate": 4.95703998838617e-07, "loss": 1.2064, "step": 26629 }, { "epoch": 0.8, "learning_rate": 4.955582168933193e-07, "loss": 1.0875, "step": 26630 }, { "epoch": 0.8, "learning_rate": 4.95412454029342e-07, "loss": 1.028, "step": 26631 }, { "epoch": 0.8, "learning_rate": 4.952667102480732e-07, "loss": 1.1951, "step": 26632 }, { "epoch": 0.8, "learning_rate": 4.951209855508996e-07, "loss": 1.0355, "step": 26633 }, { "epoch": 0.8, "learning_rate": 4.949752799392083e-07, "loss": 1.087, "step": 26634 }, { "epoch": 0.8, "learning_rate": 4.948295934143865e-07, "loss": 1.0961, "step": 26635 }, { "epoch": 0.8, "learning_rate": 4.946839259778216e-07, "loss": 1.1357, "step": 26636 }, { "epoch": 0.8, "learning_rate": 4.945382776308999e-07, "loss": 1.0746, "step": 26637 }, { "epoch": 0.8, "learning_rate": 4.943926483750084e-07, "loss": 1.1583, "step": 26638 }, { "epoch": 0.8, "learning_rate": 4.942470382115324e-07, "loss": 1.1035, "step": 26639 }, { "epoch": 0.8, "learning_rate": 4.941014471418587e-07, "loss": 1.175, "step": 26640 }, { "epoch": 0.8, "learning_rate": 4.939558751673732e-07, "loss": 1.1282, "step": 26641 }, { "epoch": 0.8, "learning_rate": 4.938103222894613e-07, "loss": 1.2959, "step": 26642 }, { "epoch": 0.8, "learning_rate": 4.936647885095092e-07, "loss": 1.2157, "step": 26643 }, { "epoch": 0.8, "learning_rate": 4.935192738289018e-07, "loss": 1.042, "step": 26644 }, { "epoch": 0.8, "learning_rate": 4.933737782490252e-07, "loss": 1.0693, "step": 26645 }, { "epoch": 0.8, "learning_rate": 4.932283017712636e-07, "loss": 1.0978, "step": 26646 }, { "epoch": 0.8, "learning_rate": 4.930828443970015e-07, "loss": 1.0382, "step": 26647 }, { "epoch": 0.8, "learning_rate": 4.929374061276246e-07, "loss": 1.2322, "step": 26648 }, { "epoch": 0.8, "learning_rate": 4.927919869645173e-07, "loss": 1.218, "step": 26649 }, { "epoch": 0.8, "learning_rate": 4.926465869090632e-07, "loss": 1.0464, "step": 26650 }, { "epoch": 0.8, "learning_rate": 4.925012059626466e-07, "loss": 1.1028, "step": 26651 }, { "epoch": 0.8, "learning_rate": 4.923558441266518e-07, "loss": 1.0266, "step": 26652 }, { "epoch": 0.8, "learning_rate": 4.92210501402463e-07, "loss": 1.1301, "step": 26653 }, { "epoch": 0.8, "learning_rate": 4.920651777914625e-07, "loss": 1.2329, "step": 26654 }, { "epoch": 0.8, "learning_rate": 4.919198732950348e-07, "loss": 1.1173, "step": 26655 }, { "epoch": 0.8, "learning_rate": 4.917745879145625e-07, "loss": 1.1777, "step": 26656 }, { "epoch": 0.8, "learning_rate": 4.916293216514289e-07, "loss": 1.0613, "step": 26657 }, { "epoch": 0.8, "learning_rate": 4.91484074507018e-07, "loss": 1.1031, "step": 26658 }, { "epoch": 0.8, "learning_rate": 4.913388464827102e-07, "loss": 1.1342, "step": 26659 }, { "epoch": 0.8, "learning_rate": 4.911936375798893e-07, "loss": 1.1245, "step": 26660 }, { "epoch": 0.8, "learning_rate": 4.910484477999375e-07, "loss": 1.1357, "step": 26661 }, { "epoch": 0.8, "learning_rate": 4.909032771442376e-07, "loss": 1.0288, "step": 26662 }, { "epoch": 0.8, "learning_rate": 4.907581256141705e-07, "loss": 1.1141, "step": 26663 }, { "epoch": 0.8, "learning_rate": 4.906129932111181e-07, "loss": 1.0637, "step": 26664 }, { "epoch": 0.8, "learning_rate": 4.90467879936462e-07, "loss": 1.1397, "step": 26665 }, { "epoch": 0.8, "learning_rate": 4.903227857915843e-07, "loss": 1.0149, "step": 26666 }, { "epoch": 0.8, "learning_rate": 4.901777107778657e-07, "loss": 1.1617, "step": 26667 }, { "epoch": 0.8, "learning_rate": 4.900326548966871e-07, "loss": 1.1689, "step": 26668 }, { "epoch": 0.8, "learning_rate": 4.8988761814943e-07, "loss": 1.0139, "step": 26669 }, { "epoch": 0.8, "learning_rate": 4.89742600537475e-07, "loss": 1.085, "step": 26670 }, { "epoch": 0.8, "learning_rate": 4.895976020622018e-07, "loss": 1.0521, "step": 26671 }, { "epoch": 0.8, "learning_rate": 4.89452622724991e-07, "loss": 1.0351, "step": 26672 }, { "epoch": 0.8, "learning_rate": 4.893076625272228e-07, "loss": 1.1569, "step": 26673 }, { "epoch": 0.8, "learning_rate": 4.891627214702777e-07, "loss": 1.0633, "step": 26674 }, { "epoch": 0.8, "learning_rate": 4.890177995555353e-07, "loss": 0.9084, "step": 26675 }, { "epoch": 0.8, "learning_rate": 4.888728967843745e-07, "loss": 1.0567, "step": 26676 }, { "epoch": 0.8, "learning_rate": 4.887280131581751e-07, "loss": 1.1077, "step": 26677 }, { "epoch": 0.8, "learning_rate": 4.885831486783163e-07, "loss": 1.074, "step": 26678 }, { "epoch": 0.8, "learning_rate": 4.884383033461779e-07, "loss": 1.1755, "step": 26679 }, { "epoch": 0.8, "learning_rate": 4.882934771631373e-07, "loss": 1.1857, "step": 26680 }, { "epoch": 0.8, "learning_rate": 4.881486701305738e-07, "loss": 1.0934, "step": 26681 }, { "epoch": 0.8, "learning_rate": 4.880038822498662e-07, "loss": 1.1019, "step": 26682 }, { "epoch": 0.8, "learning_rate": 4.878591135223934e-07, "loss": 1.0472, "step": 26683 }, { "epoch": 0.8, "learning_rate": 4.877143639495319e-07, "loss": 1.0364, "step": 26684 }, { "epoch": 0.8, "learning_rate": 4.875696335326608e-07, "loss": 1.2593, "step": 26685 }, { "epoch": 0.8, "learning_rate": 4.874249222731573e-07, "loss": 1.1403, "step": 26686 }, { "epoch": 0.8, "learning_rate": 4.872802301723992e-07, "loss": 1.0743, "step": 26687 }, { "epoch": 0.8, "learning_rate": 4.871355572317648e-07, "loss": 1.0808, "step": 26688 }, { "epoch": 0.8, "learning_rate": 4.869909034526296e-07, "loss": 1.0662, "step": 26689 }, { "epoch": 0.8, "learning_rate": 4.868462688363717e-07, "loss": 1.0548, "step": 26690 }, { "epoch": 0.8, "learning_rate": 4.867016533843677e-07, "loss": 1.0464, "step": 26691 }, { "epoch": 0.8, "learning_rate": 4.865570570979944e-07, "loss": 1.0463, "step": 26692 }, { "epoch": 0.8, "learning_rate": 4.86412479978628e-07, "loss": 1.2435, "step": 26693 }, { "epoch": 0.8, "learning_rate": 4.86267922027645e-07, "loss": 1.0678, "step": 26694 }, { "epoch": 0.8, "learning_rate": 4.861233832464218e-07, "loss": 1.0805, "step": 26695 }, { "epoch": 0.8, "learning_rate": 4.859788636363346e-07, "loss": 1.1094, "step": 26696 }, { "epoch": 0.8, "learning_rate": 4.858343631987581e-07, "loss": 0.9767, "step": 26697 }, { "epoch": 0.8, "learning_rate": 4.85689881935068e-07, "loss": 1.1155, "step": 26698 }, { "epoch": 0.8, "learning_rate": 4.855454198466405e-07, "loss": 0.9399, "step": 26699 }, { "epoch": 0.8, "learning_rate": 4.854009769348502e-07, "loss": 0.9948, "step": 26700 }, { "epoch": 0.8, "learning_rate": 4.852565532010731e-07, "loss": 1.1743, "step": 26701 }, { "epoch": 0.8, "learning_rate": 4.851121486466828e-07, "loss": 1.12, "step": 26702 }, { "epoch": 0.8, "learning_rate": 4.84967763273054e-07, "loss": 1.0994, "step": 26703 }, { "epoch": 0.8, "learning_rate": 4.848233970815619e-07, "loss": 1.3264, "step": 26704 }, { "epoch": 0.8, "learning_rate": 4.846790500735812e-07, "loss": 1.1763, "step": 26705 }, { "epoch": 0.8, "learning_rate": 4.845347222504845e-07, "loss": 1.0808, "step": 26706 }, { "epoch": 0.8, "learning_rate": 4.843904136136468e-07, "loss": 0.9594, "step": 26707 }, { "epoch": 0.8, "learning_rate": 4.842461241644414e-07, "loss": 1.1879, "step": 26708 }, { "epoch": 0.8, "learning_rate": 4.84101853904243e-07, "loss": 1.13, "step": 26709 }, { "epoch": 0.8, "learning_rate": 4.839576028344232e-07, "loss": 1.133, "step": 26710 }, { "epoch": 0.8, "learning_rate": 4.838133709563561e-07, "loss": 1.0695, "step": 26711 }, { "epoch": 0.8, "learning_rate": 4.836691582714145e-07, "loss": 0.9899, "step": 26712 }, { "epoch": 0.8, "learning_rate": 4.835249647809717e-07, "loss": 1.0833, "step": 26713 }, { "epoch": 0.8, "learning_rate": 4.833807904864005e-07, "loss": 1.0747, "step": 26714 }, { "epoch": 0.8, "learning_rate": 4.832366353890724e-07, "loss": 1.082, "step": 26715 }, { "epoch": 0.8, "learning_rate": 4.830924994903602e-07, "loss": 0.9834, "step": 26716 }, { "epoch": 0.8, "learning_rate": 4.829483827916362e-07, "loss": 1.1937, "step": 26717 }, { "epoch": 0.8, "learning_rate": 4.828042852942719e-07, "loss": 0.9649, "step": 26718 }, { "epoch": 0.8, "learning_rate": 4.826602069996394e-07, "loss": 1.0088, "step": 26719 }, { "epoch": 0.8, "learning_rate": 4.8251614790911e-07, "loss": 1.1026, "step": 26720 }, { "epoch": 0.8, "learning_rate": 4.823721080240562e-07, "loss": 1.0761, "step": 26721 }, { "epoch": 0.81, "learning_rate": 4.822280873458474e-07, "loss": 1.0041, "step": 26722 }, { "epoch": 0.81, "learning_rate": 4.820840858758552e-07, "loss": 1.1349, "step": 26723 }, { "epoch": 0.81, "learning_rate": 4.819401036154508e-07, "loss": 1.2547, "step": 26724 }, { "epoch": 0.81, "learning_rate": 4.817961405660046e-07, "loss": 1.0748, "step": 26725 }, { "epoch": 0.81, "learning_rate": 4.816521967288873e-07, "loss": 1.0695, "step": 26726 }, { "epoch": 0.81, "learning_rate": 4.815082721054698e-07, "loss": 1.0894, "step": 26727 }, { "epoch": 0.81, "learning_rate": 4.813643666971205e-07, "loss": 1.1099, "step": 26728 }, { "epoch": 0.81, "learning_rate": 4.812204805052101e-07, "loss": 1.1324, "step": 26729 }, { "epoch": 0.81, "learning_rate": 4.810766135311087e-07, "loss": 1.1479, "step": 26730 }, { "epoch": 0.81, "learning_rate": 4.809327657761861e-07, "loss": 1.2925, "step": 26731 }, { "epoch": 0.81, "learning_rate": 4.807889372418107e-07, "loss": 1.1049, "step": 26732 }, { "epoch": 0.81, "learning_rate": 4.80645127929352e-07, "loss": 1.0289, "step": 26733 }, { "epoch": 0.81, "learning_rate": 4.80501337840179e-07, "loss": 0.9136, "step": 26734 }, { "epoch": 0.81, "learning_rate": 4.803575669756616e-07, "loss": 1.061, "step": 26735 }, { "epoch": 0.81, "learning_rate": 4.802138153371666e-07, "loss": 1.0251, "step": 26736 }, { "epoch": 0.81, "learning_rate": 4.800700829260635e-07, "loss": 1.2432, "step": 26737 }, { "epoch": 0.81, "learning_rate": 4.799263697437201e-07, "loss": 1.0213, "step": 26738 }, { "epoch": 0.81, "learning_rate": 4.797826757915051e-07, "loss": 1.0154, "step": 26739 }, { "epoch": 0.81, "learning_rate": 4.796390010707863e-07, "loss": 1.1151, "step": 26740 }, { "epoch": 0.81, "learning_rate": 4.794953455829307e-07, "loss": 1.2255, "step": 26741 }, { "epoch": 0.81, "learning_rate": 4.793517093293063e-07, "loss": 0.9701, "step": 26742 }, { "epoch": 0.81, "learning_rate": 4.792080923112805e-07, "loss": 1.0781, "step": 26743 }, { "epoch": 0.81, "learning_rate": 4.790644945302212e-07, "loss": 1.0479, "step": 26744 }, { "epoch": 0.81, "learning_rate": 4.789209159874936e-07, "loss": 1.0458, "step": 26745 }, { "epoch": 0.81, "learning_rate": 4.787773566844658e-07, "loss": 1.1274, "step": 26746 }, { "epoch": 0.81, "learning_rate": 4.786338166225041e-07, "loss": 1.2301, "step": 26747 }, { "epoch": 0.81, "learning_rate": 4.784902958029746e-07, "loss": 1.0396, "step": 26748 }, { "epoch": 0.81, "learning_rate": 4.783467942272444e-07, "loss": 1.093, "step": 26749 }, { "epoch": 0.81, "learning_rate": 4.782033118966786e-07, "loss": 1.1595, "step": 26750 }, { "epoch": 0.81, "learning_rate": 4.780598488126437e-07, "loss": 1.074, "step": 26751 }, { "epoch": 0.81, "learning_rate": 4.779164049765053e-07, "loss": 1.1156, "step": 26752 }, { "epoch": 0.81, "learning_rate": 4.777729803896295e-07, "loss": 1.1522, "step": 26753 }, { "epoch": 0.81, "learning_rate": 4.776295750533802e-07, "loss": 1.0342, "step": 26754 }, { "epoch": 0.81, "learning_rate": 4.774861889691235e-07, "loss": 1.1772, "step": 26755 }, { "epoch": 0.81, "learning_rate": 4.773428221382242e-07, "loss": 1.1407, "step": 26756 }, { "epoch": 0.81, "learning_rate": 4.771994745620476e-07, "loss": 1.1052, "step": 26757 }, { "epoch": 0.81, "learning_rate": 4.770561462419573e-07, "loss": 1.0309, "step": 26758 }, { "epoch": 0.81, "learning_rate": 4.769128371793181e-07, "loss": 1.0909, "step": 26759 }, { "epoch": 0.81, "learning_rate": 4.7676954737549436e-07, "loss": 1.0845, "step": 26760 }, { "epoch": 0.81, "learning_rate": 4.766262768318508e-07, "loss": 1.1458, "step": 26761 }, { "epoch": 0.81, "learning_rate": 4.764830255497499e-07, "loss": 1.2075, "step": 26762 }, { "epoch": 0.81, "learning_rate": 4.763397935305561e-07, "loss": 1.0466, "step": 26763 }, { "epoch": 0.81, "learning_rate": 4.7619658077563275e-07, "loss": 1.108, "step": 26764 }, { "epoch": 0.81, "learning_rate": 4.7605338728634323e-07, "loss": 1.1584, "step": 26765 }, { "epoch": 0.81, "learning_rate": 4.7591021306405137e-07, "loss": 1.0999, "step": 26766 }, { "epoch": 0.81, "learning_rate": 4.75767058110119e-07, "loss": 1.1898, "step": 26767 }, { "epoch": 0.81, "learning_rate": 4.7562392242590903e-07, "loss": 1.2347, "step": 26768 }, { "epoch": 0.81, "learning_rate": 4.754808060127844e-07, "loss": 1.1545, "step": 26769 }, { "epoch": 0.81, "learning_rate": 4.7533770887210837e-07, "loss": 1.0637, "step": 26770 }, { "epoch": 0.81, "learning_rate": 4.751946310052413e-07, "loss": 1.1127, "step": 26771 }, { "epoch": 0.81, "learning_rate": 4.7505157241354625e-07, "loss": 1.0452, "step": 26772 }, { "epoch": 0.81, "learning_rate": 4.749085330983852e-07, "loss": 1.2263, "step": 26773 }, { "epoch": 0.81, "learning_rate": 4.7476551306111924e-07, "loss": 1.0388, "step": 26774 }, { "epoch": 0.81, "learning_rate": 4.746225123031104e-07, "loss": 1.2545, "step": 26775 }, { "epoch": 0.81, "learning_rate": 4.744795308257197e-07, "loss": 1.1263, "step": 26776 }, { "epoch": 0.81, "learning_rate": 4.7433656863030833e-07, "loss": 1.0969, "step": 26777 }, { "epoch": 0.81, "learning_rate": 4.741936257182375e-07, "loss": 1.1104, "step": 26778 }, { "epoch": 0.81, "learning_rate": 4.74050702090868e-07, "loss": 1.0707, "step": 26779 }, { "epoch": 0.81, "learning_rate": 4.7390779774955956e-07, "loss": 1.1014, "step": 26780 }, { "epoch": 0.81, "learning_rate": 4.737649126956731e-07, "loss": 1.1329, "step": 26781 }, { "epoch": 0.81, "learning_rate": 4.7362204693056886e-07, "loss": 1.1418, "step": 26782 }, { "epoch": 0.81, "learning_rate": 4.734792004556074e-07, "loss": 1.0622, "step": 26783 }, { "epoch": 0.81, "learning_rate": 4.7333637327214745e-07, "loss": 1.0623, "step": 26784 }, { "epoch": 0.81, "learning_rate": 4.7319356538154893e-07, "loss": 1.0541, "step": 26785 }, { "epoch": 0.81, "learning_rate": 4.730507767851716e-07, "loss": 1.04, "step": 26786 }, { "epoch": 0.81, "learning_rate": 4.729080074843753e-07, "loss": 1.2128, "step": 26787 }, { "epoch": 0.81, "learning_rate": 4.727652574805178e-07, "loss": 1.0996, "step": 26788 }, { "epoch": 0.81, "learning_rate": 4.726225267749587e-07, "loss": 1.1866, "step": 26789 }, { "epoch": 0.81, "learning_rate": 4.7247981536905683e-07, "loss": 1.0277, "step": 26790 }, { "epoch": 0.81, "learning_rate": 4.7233712326417046e-07, "loss": 0.9565, "step": 26791 }, { "epoch": 0.81, "learning_rate": 4.721944504616588e-07, "loss": 1.1855, "step": 26792 }, { "epoch": 0.81, "learning_rate": 4.720517969628788e-07, "loss": 1.07, "step": 26793 }, { "epoch": 0.81, "learning_rate": 4.7190916276918906e-07, "loss": 0.9344, "step": 26794 }, { "epoch": 0.81, "learning_rate": 4.717665478819472e-07, "loss": 1.0919, "step": 26795 }, { "epoch": 0.81, "learning_rate": 4.716239523025118e-07, "loss": 1.0865, "step": 26796 }, { "epoch": 0.81, "learning_rate": 4.714813760322387e-07, "loss": 1.153, "step": 26797 }, { "epoch": 0.81, "learning_rate": 4.7133881907248573e-07, "loss": 1.1696, "step": 26798 }, { "epoch": 0.81, "learning_rate": 4.711962814246104e-07, "loss": 1.0848, "step": 26799 }, { "epoch": 0.81, "learning_rate": 4.710537630899695e-07, "loss": 1.0505, "step": 26800 }, { "epoch": 0.81, "learning_rate": 4.709112640699193e-07, "loss": 1.1852, "step": 26801 }, { "epoch": 0.81, "learning_rate": 4.707687843658168e-07, "loss": 1.0508, "step": 26802 }, { "epoch": 0.81, "learning_rate": 4.7062632397901876e-07, "loss": 1.1682, "step": 26803 }, { "epoch": 0.81, "learning_rate": 4.7048388291087987e-07, "loss": 1.094, "step": 26804 }, { "epoch": 0.81, "learning_rate": 4.703414611627574e-07, "loss": 1.2061, "step": 26805 }, { "epoch": 0.81, "learning_rate": 4.701990587360064e-07, "loss": 1.1042, "step": 26806 }, { "epoch": 0.81, "learning_rate": 4.70056675631983e-07, "loss": 1.0348, "step": 26807 }, { "epoch": 0.81, "learning_rate": 4.6991431185204217e-07, "loss": 1.15, "step": 26808 }, { "epoch": 0.81, "learning_rate": 4.697719673975401e-07, "loss": 1.1415, "step": 26809 }, { "epoch": 0.81, "learning_rate": 4.696296422698304e-07, "loss": 1.0345, "step": 26810 }, { "epoch": 0.81, "learning_rate": 4.6948733647026875e-07, "loss": 1.2621, "step": 26811 }, { "epoch": 0.81, "learning_rate": 4.6934505000020974e-07, "loss": 1.0931, "step": 26812 }, { "epoch": 0.81, "learning_rate": 4.692027828610082e-07, "loss": 1.1641, "step": 26813 }, { "epoch": 0.81, "learning_rate": 4.690605350540178e-07, "loss": 1.1707, "step": 26814 }, { "epoch": 0.81, "learning_rate": 4.68918306580593e-07, "loss": 1.0214, "step": 26815 }, { "epoch": 0.81, "learning_rate": 4.6877609744208743e-07, "loss": 1.0663, "step": 26816 }, { "epoch": 0.81, "learning_rate": 4.686339076398555e-07, "loss": 1.2599, "step": 26817 }, { "epoch": 0.81, "learning_rate": 4.684917371752506e-07, "loss": 1.0677, "step": 26818 }, { "epoch": 0.81, "learning_rate": 4.6834958604962566e-07, "loss": 1.116, "step": 26819 }, { "epoch": 0.81, "learning_rate": 4.6820745426433416e-07, "loss": 1.0701, "step": 26820 }, { "epoch": 0.81, "learning_rate": 4.68065341820729e-07, "loss": 1.0383, "step": 26821 }, { "epoch": 0.81, "learning_rate": 4.6792324872016403e-07, "loss": 1.0956, "step": 26822 }, { "epoch": 0.81, "learning_rate": 4.6778117496399046e-07, "loss": 1.1339, "step": 26823 }, { "epoch": 0.81, "learning_rate": 4.67639120553561e-07, "loss": 1.2478, "step": 26824 }, { "epoch": 0.81, "learning_rate": 4.674970854902286e-07, "loss": 1.125, "step": 26825 }, { "epoch": 0.81, "learning_rate": 4.673550697753454e-07, "loss": 1.1268, "step": 26826 }, { "epoch": 0.81, "learning_rate": 4.6721307341026257e-07, "loss": 1.0191, "step": 26827 }, { "epoch": 0.81, "learning_rate": 4.6707109639633235e-07, "loss": 1.118, "step": 26828 }, { "epoch": 0.81, "learning_rate": 4.669291387349059e-07, "loss": 1.127, "step": 26829 }, { "epoch": 0.81, "learning_rate": 4.6678720042733524e-07, "loss": 1.1537, "step": 26830 }, { "epoch": 0.81, "learning_rate": 4.6664528147497086e-07, "loss": 1.1399, "step": 26831 }, { "epoch": 0.81, "learning_rate": 4.665033818791642e-07, "loss": 1.1581, "step": 26832 }, { "epoch": 0.81, "learning_rate": 4.663615016412662e-07, "loss": 1.061, "step": 26833 }, { "epoch": 0.81, "learning_rate": 4.662196407626271e-07, "loss": 0.9205, "step": 26834 }, { "epoch": 0.81, "learning_rate": 4.660777992445981e-07, "loss": 1.1005, "step": 26835 }, { "epoch": 0.81, "learning_rate": 4.659359770885283e-07, "loss": 1.1554, "step": 26836 }, { "epoch": 0.81, "learning_rate": 4.6579417429576833e-07, "loss": 1.1378, "step": 26837 }, { "epoch": 0.81, "learning_rate": 4.656523908676683e-07, "loss": 1.1924, "step": 26838 }, { "epoch": 0.81, "learning_rate": 4.6551062680557813e-07, "loss": 1.1608, "step": 26839 }, { "epoch": 0.81, "learning_rate": 4.6536888211084624e-07, "loss": 1.0491, "step": 26840 }, { "epoch": 0.81, "learning_rate": 4.6522715678482293e-07, "loss": 1.0574, "step": 26841 }, { "epoch": 0.81, "learning_rate": 4.6508545082885716e-07, "loss": 1.2547, "step": 26842 }, { "epoch": 0.81, "learning_rate": 4.649437642442975e-07, "loss": 1.1743, "step": 26843 }, { "epoch": 0.81, "learning_rate": 4.64802097032494e-07, "loss": 1.175, "step": 26844 }, { "epoch": 0.81, "learning_rate": 4.6466044919479367e-07, "loss": 1.0856, "step": 26845 }, { "epoch": 0.81, "learning_rate": 4.6451882073254574e-07, "loss": 1.1652, "step": 26846 }, { "epoch": 0.81, "learning_rate": 4.6437721164709794e-07, "loss": 1.0463, "step": 26847 }, { "epoch": 0.81, "learning_rate": 4.6423562193979976e-07, "loss": 1.0406, "step": 26848 }, { "epoch": 0.81, "learning_rate": 4.6409405161199713e-07, "loss": 1.0656, "step": 26849 }, { "epoch": 0.81, "learning_rate": 4.639525006650386e-07, "loss": 1.1301, "step": 26850 }, { "epoch": 0.81, "learning_rate": 4.6381096910027154e-07, "loss": 1.1573, "step": 26851 }, { "epoch": 0.81, "learning_rate": 4.636694569190442e-07, "loss": 1.0746, "step": 26852 }, { "epoch": 0.81, "learning_rate": 4.6352796412270225e-07, "loss": 1.1177, "step": 26853 }, { "epoch": 0.81, "learning_rate": 4.6338649071259346e-07, "loss": 1.1565, "step": 26854 }, { "epoch": 0.81, "learning_rate": 4.6324503669006426e-07, "loss": 0.9729, "step": 26855 }, { "epoch": 0.81, "learning_rate": 4.6310360205646136e-07, "loss": 1.04, "step": 26856 }, { "epoch": 0.81, "learning_rate": 4.6296218681313093e-07, "loss": 1.0792, "step": 26857 }, { "epoch": 0.81, "learning_rate": 4.6282079096141963e-07, "loss": 1.0981, "step": 26858 }, { "epoch": 0.81, "learning_rate": 4.6267941450267335e-07, "loss": 1.105, "step": 26859 }, { "epoch": 0.81, "learning_rate": 4.625380574382379e-07, "loss": 1.0643, "step": 26860 }, { "epoch": 0.81, "learning_rate": 4.6239671976945926e-07, "loss": 1.2139, "step": 26861 }, { "epoch": 0.81, "learning_rate": 4.622554014976821e-07, "loss": 1.0301, "step": 26862 }, { "epoch": 0.81, "learning_rate": 4.6211410262425175e-07, "loss": 1.1536, "step": 26863 }, { "epoch": 0.81, "learning_rate": 4.619728231505141e-07, "loss": 1.1456, "step": 26864 }, { "epoch": 0.81, "learning_rate": 4.618315630778139e-07, "loss": 0.9985, "step": 26865 }, { "epoch": 0.81, "learning_rate": 4.6169032240749506e-07, "loss": 1.0538, "step": 26866 }, { "epoch": 0.81, "learning_rate": 4.615491011409029e-07, "loss": 1.2155, "step": 26867 }, { "epoch": 0.81, "learning_rate": 4.614078992793813e-07, "loss": 1.1308, "step": 26868 }, { "epoch": 0.81, "learning_rate": 4.6126671682427545e-07, "loss": 1.1678, "step": 26869 }, { "epoch": 0.81, "learning_rate": 4.611255537769277e-07, "loss": 1.1752, "step": 26870 }, { "epoch": 0.81, "learning_rate": 4.609844101386829e-07, "loss": 1.0362, "step": 26871 }, { "epoch": 0.81, "learning_rate": 4.6084328591088467e-07, "loss": 1.0161, "step": 26872 }, { "epoch": 0.81, "learning_rate": 4.6070218109487586e-07, "loss": 1.1476, "step": 26873 }, { "epoch": 0.81, "learning_rate": 4.605610956920012e-07, "loss": 1.0309, "step": 26874 }, { "epoch": 0.81, "learning_rate": 4.6042002970360183e-07, "loss": 1.2559, "step": 26875 }, { "epoch": 0.81, "learning_rate": 4.6027898313102144e-07, "loss": 1.1044, "step": 26876 }, { "epoch": 0.81, "learning_rate": 4.601379559756028e-07, "loss": 0.9716, "step": 26877 }, { "epoch": 0.81, "learning_rate": 4.59996948238689e-07, "loss": 1.0435, "step": 26878 }, { "epoch": 0.81, "learning_rate": 4.5985595992162123e-07, "loss": 1.0705, "step": 26879 }, { "epoch": 0.81, "learning_rate": 4.59714991025742e-07, "loss": 1.2331, "step": 26880 }, { "epoch": 0.81, "learning_rate": 4.595740415523936e-07, "loss": 1.2541, "step": 26881 }, { "epoch": 0.81, "learning_rate": 4.5943311150291744e-07, "loss": 1.0819, "step": 26882 }, { "epoch": 0.81, "learning_rate": 4.5929220087865546e-07, "loss": 1.0897, "step": 26883 }, { "epoch": 0.81, "learning_rate": 4.5915130968094854e-07, "loss": 1.0803, "step": 26884 }, { "epoch": 0.81, "learning_rate": 4.590104379111393e-07, "loss": 1.0375, "step": 26885 }, { "epoch": 0.81, "learning_rate": 4.5886958557056685e-07, "loss": 1.0094, "step": 26886 }, { "epoch": 0.81, "learning_rate": 4.58728752660573e-07, "loss": 1.252, "step": 26887 }, { "epoch": 0.81, "learning_rate": 4.5858793918249825e-07, "loss": 1.129, "step": 26888 }, { "epoch": 0.81, "learning_rate": 4.584471451376832e-07, "loss": 1.1033, "step": 26889 }, { "epoch": 0.81, "learning_rate": 4.583063705274679e-07, "loss": 1.1409, "step": 26890 }, { "epoch": 0.81, "learning_rate": 4.5816561535319353e-07, "loss": 1.0768, "step": 26891 }, { "epoch": 0.81, "learning_rate": 4.5802487961619845e-07, "loss": 1.0822, "step": 26892 }, { "epoch": 0.81, "learning_rate": 4.57884163317823e-07, "loss": 1.0539, "step": 26893 }, { "epoch": 0.81, "learning_rate": 4.577434664594069e-07, "loss": 0.9732, "step": 26894 }, { "epoch": 0.81, "learning_rate": 4.576027890422899e-07, "loss": 1.0386, "step": 26895 }, { "epoch": 0.81, "learning_rate": 4.5746213106781014e-07, "loss": 1.1501, "step": 26896 }, { "epoch": 0.81, "learning_rate": 4.5732149253730707e-07, "loss": 1.0229, "step": 26897 }, { "epoch": 0.81, "learning_rate": 4.571808734521196e-07, "loss": 1.1439, "step": 26898 }, { "epoch": 0.81, "learning_rate": 4.5704027381358653e-07, "loss": 1.1054, "step": 26899 }, { "epoch": 0.81, "learning_rate": 4.568996936230466e-07, "loss": 1.1147, "step": 26900 }, { "epoch": 0.81, "learning_rate": 4.5675913288183716e-07, "loss": 1.0793, "step": 26901 }, { "epoch": 0.81, "learning_rate": 4.5661859159129654e-07, "loss": 1.1259, "step": 26902 }, { "epoch": 0.81, "learning_rate": 4.5647806975276295e-07, "loss": 1.0418, "step": 26903 }, { "epoch": 0.81, "learning_rate": 4.563375673675743e-07, "loss": 1.0876, "step": 26904 }, { "epoch": 0.81, "learning_rate": 4.5619708443706723e-07, "loss": 1.0693, "step": 26905 }, { "epoch": 0.81, "learning_rate": 4.5605662096257967e-07, "loss": 1.1941, "step": 26906 }, { "epoch": 0.81, "learning_rate": 4.559161769454487e-07, "loss": 0.9527, "step": 26907 }, { "epoch": 0.81, "learning_rate": 4.557757523870118e-07, "loss": 1.0644, "step": 26908 }, { "epoch": 0.81, "learning_rate": 4.5563534728860464e-07, "loss": 1.0621, "step": 26909 }, { "epoch": 0.81, "learning_rate": 4.5549496165156443e-07, "loss": 1.0721, "step": 26910 }, { "epoch": 0.81, "learning_rate": 4.553545954772273e-07, "loss": 1.1893, "step": 26911 }, { "epoch": 0.81, "learning_rate": 4.5521424876693006e-07, "loss": 1.1827, "step": 26912 }, { "epoch": 0.81, "learning_rate": 4.550739215220082e-07, "loss": 1.1478, "step": 26913 }, { "epoch": 0.81, "learning_rate": 4.549336137437976e-07, "loss": 1.102, "step": 26914 }, { "epoch": 0.81, "learning_rate": 4.5479332543363397e-07, "loss": 1.1525, "step": 26915 }, { "epoch": 0.81, "learning_rate": 4.5465305659285306e-07, "loss": 1.1483, "step": 26916 }, { "epoch": 0.81, "learning_rate": 4.5451280722279055e-07, "loss": 1.1174, "step": 26917 }, { "epoch": 0.81, "learning_rate": 4.5437257732478064e-07, "loss": 1.0838, "step": 26918 }, { "epoch": 0.81, "learning_rate": 4.5423236690015834e-07, "loss": 1.1396, "step": 26919 }, { "epoch": 0.81, "learning_rate": 4.540921759502584e-07, "loss": 1.1346, "step": 26920 }, { "epoch": 0.81, "learning_rate": 4.5395200447641646e-07, "loss": 1.0469, "step": 26921 }, { "epoch": 0.81, "learning_rate": 4.538118524799656e-07, "loss": 1.0513, "step": 26922 }, { "epoch": 0.81, "learning_rate": 4.5367171996224007e-07, "loss": 1.1741, "step": 26923 }, { "epoch": 0.81, "learning_rate": 4.5353160692457433e-07, "loss": 1.2139, "step": 26924 }, { "epoch": 0.81, "learning_rate": 4.533915133683023e-07, "loss": 1.0376, "step": 26925 }, { "epoch": 0.81, "learning_rate": 4.532514392947576e-07, "loss": 1.084, "step": 26926 }, { "epoch": 0.81, "learning_rate": 4.5311138470527315e-07, "loss": 1.0602, "step": 26927 }, { "epoch": 0.81, "learning_rate": 4.5297134960118257e-07, "loss": 1.1161, "step": 26928 }, { "epoch": 0.81, "learning_rate": 4.5283133398381863e-07, "loss": 0.9973, "step": 26929 }, { "epoch": 0.81, "learning_rate": 4.5269133785451505e-07, "loss": 1.1378, "step": 26930 }, { "epoch": 0.81, "learning_rate": 4.5255136121460345e-07, "loss": 1.1055, "step": 26931 }, { "epoch": 0.81, "learning_rate": 4.524114040654168e-07, "loss": 1.1993, "step": 26932 }, { "epoch": 0.81, "learning_rate": 4.5227146640828723e-07, "loss": 1.1249, "step": 26933 }, { "epoch": 0.81, "learning_rate": 4.521315482445479e-07, "loss": 1.0305, "step": 26934 }, { "epoch": 0.81, "learning_rate": 4.5199164957552915e-07, "loss": 1.1716, "step": 26935 }, { "epoch": 0.81, "learning_rate": 4.5185177040256376e-07, "loss": 1.0891, "step": 26936 }, { "epoch": 0.81, "learning_rate": 4.51711910726983e-07, "loss": 1.1487, "step": 26937 }, { "epoch": 0.81, "learning_rate": 4.5157207055011836e-07, "loss": 1.1089, "step": 26938 }, { "epoch": 0.81, "learning_rate": 4.5143224987330094e-07, "loss": 1.1023, "step": 26939 }, { "epoch": 0.81, "learning_rate": 4.5129244869786203e-07, "loss": 1.1308, "step": 26940 }, { "epoch": 0.81, "learning_rate": 4.5115266702513205e-07, "loss": 0.9907, "step": 26941 }, { "epoch": 0.81, "learning_rate": 4.510129048564421e-07, "loss": 1.1149, "step": 26942 }, { "epoch": 0.81, "learning_rate": 4.508731621931234e-07, "loss": 1.1107, "step": 26943 }, { "epoch": 0.81, "learning_rate": 4.5073343903650426e-07, "loss": 0.9819, "step": 26944 }, { "epoch": 0.81, "learning_rate": 4.5059373538791585e-07, "loss": 1.1106, "step": 26945 }, { "epoch": 0.81, "learning_rate": 4.5045405124868823e-07, "loss": 1.1476, "step": 26946 }, { "epoch": 0.81, "learning_rate": 4.5031438662015146e-07, "loss": 1.1009, "step": 26947 }, { "epoch": 0.81, "learning_rate": 4.5017474150363394e-07, "loss": 1.1396, "step": 26948 }, { "epoch": 0.81, "learning_rate": 4.500351159004657e-07, "loss": 1.1128, "step": 26949 }, { "epoch": 0.81, "learning_rate": 4.498955098119759e-07, "loss": 1.1456, "step": 26950 }, { "epoch": 0.81, "learning_rate": 4.4975592323949354e-07, "loss": 1.041, "step": 26951 }, { "epoch": 0.81, "learning_rate": 4.496163561843478e-07, "loss": 1.0252, "step": 26952 }, { "epoch": 0.81, "learning_rate": 4.4947680864786627e-07, "loss": 0.9406, "step": 26953 }, { "epoch": 0.81, "learning_rate": 4.493372806313781e-07, "loss": 1.1495, "step": 26954 }, { "epoch": 0.81, "learning_rate": 4.491977721362112e-07, "loss": 1.0377, "step": 26955 }, { "epoch": 0.81, "learning_rate": 4.4905828316369445e-07, "loss": 1.0936, "step": 26956 }, { "epoch": 0.81, "learning_rate": 4.4891881371515453e-07, "loss": 1.0861, "step": 26957 }, { "epoch": 0.81, "learning_rate": 4.487793637919197e-07, "loss": 1.1281, "step": 26958 }, { "epoch": 0.81, "learning_rate": 4.486399333953173e-07, "loss": 1.2089, "step": 26959 }, { "epoch": 0.81, "learning_rate": 4.4850052252667557e-07, "loss": 1.1499, "step": 26960 }, { "epoch": 0.81, "learning_rate": 4.483611311873201e-07, "loss": 1.1607, "step": 26961 }, { "epoch": 0.81, "learning_rate": 4.482217593785784e-07, "loss": 1.0571, "step": 26962 }, { "epoch": 0.81, "learning_rate": 4.480824071017778e-07, "loss": 1.1245, "step": 26963 }, { "epoch": 0.81, "learning_rate": 4.479430743582441e-07, "loss": 1.1641, "step": 26964 }, { "epoch": 0.81, "learning_rate": 4.478037611493041e-07, "loss": 0.9814, "step": 26965 }, { "epoch": 0.81, "learning_rate": 4.4766446747628396e-07, "loss": 1.1105, "step": 26966 }, { "epoch": 0.81, "learning_rate": 4.475251933405095e-07, "loss": 1.1024, "step": 26967 }, { "epoch": 0.81, "learning_rate": 4.4738593874330743e-07, "loss": 1.1589, "step": 26968 }, { "epoch": 0.81, "learning_rate": 4.47246703686002e-07, "loss": 1.1387, "step": 26969 }, { "epoch": 0.81, "learning_rate": 4.4710748816991945e-07, "loss": 1.0789, "step": 26970 }, { "epoch": 0.81, "learning_rate": 4.4696829219638473e-07, "loss": 1.0017, "step": 26971 }, { "epoch": 0.81, "learning_rate": 4.4682911576672316e-07, "loss": 1.0539, "step": 26972 }, { "epoch": 0.81, "learning_rate": 4.466899588822604e-07, "loss": 1.0059, "step": 26973 }, { "epoch": 0.81, "learning_rate": 4.465508215443193e-07, "loss": 1.1957, "step": 26974 }, { "epoch": 0.81, "learning_rate": 4.4641170375422563e-07, "loss": 1.1277, "step": 26975 }, { "epoch": 0.81, "learning_rate": 4.4627260551330346e-07, "loss": 1.1609, "step": 26976 }, { "epoch": 0.81, "learning_rate": 4.4613352682287696e-07, "loss": 1.0602, "step": 26977 }, { "epoch": 0.81, "learning_rate": 4.459944676842709e-07, "loss": 1.101, "step": 26978 }, { "epoch": 0.81, "learning_rate": 4.4585542809880754e-07, "loss": 1.1329, "step": 26979 }, { "epoch": 0.81, "learning_rate": 4.457164080678111e-07, "loss": 1.2139, "step": 26980 }, { "epoch": 0.81, "learning_rate": 4.45577407592605e-07, "loss": 1.1497, "step": 26981 }, { "epoch": 0.81, "learning_rate": 4.4543842667451346e-07, "loss": 1.1351, "step": 26982 }, { "epoch": 0.81, "learning_rate": 4.452994653148579e-07, "loss": 1.0786, "step": 26983 }, { "epoch": 0.81, "learning_rate": 4.451605235149617e-07, "loss": 1.0556, "step": 26984 }, { "epoch": 0.81, "learning_rate": 4.450216012761477e-07, "loss": 1.0057, "step": 26985 }, { "epoch": 0.81, "learning_rate": 4.4488269859973897e-07, "loss": 1.1713, "step": 26986 }, { "epoch": 0.81, "learning_rate": 4.4474381548705646e-07, "loss": 1.0757, "step": 26987 }, { "epoch": 0.81, "learning_rate": 4.446049519394233e-07, "loss": 1.0864, "step": 26988 }, { "epoch": 0.81, "learning_rate": 4.4446610795816083e-07, "loss": 1.1102, "step": 26989 }, { "epoch": 0.81, "learning_rate": 4.443272835445911e-07, "loss": 1.0675, "step": 26990 }, { "epoch": 0.81, "learning_rate": 4.4418847870003614e-07, "loss": 1.1464, "step": 26991 }, { "epoch": 0.81, "learning_rate": 4.4404969342581623e-07, "loss": 1.0543, "step": 26992 }, { "epoch": 0.81, "learning_rate": 4.4391092772325283e-07, "loss": 1.0486, "step": 26993 }, { "epoch": 0.81, "learning_rate": 4.437721815936674e-07, "loss": 1.0999, "step": 26994 }, { "epoch": 0.81, "learning_rate": 4.436334550383803e-07, "loss": 1.0648, "step": 26995 }, { "epoch": 0.81, "learning_rate": 4.4349474805871265e-07, "loss": 1.0408, "step": 26996 }, { "epoch": 0.81, "learning_rate": 4.433560606559842e-07, "loss": 0.9823, "step": 26997 }, { "epoch": 0.81, "learning_rate": 4.432173928315156e-07, "loss": 1.1385, "step": 26998 }, { "epoch": 0.81, "learning_rate": 4.4307874458662777e-07, "loss": 1.269, "step": 26999 }, { "epoch": 0.81, "learning_rate": 4.4294011592263875e-07, "loss": 1.1118, "step": 27000 }, { "epoch": 0.81, "learning_rate": 4.428015068408692e-07, "loss": 1.1505, "step": 27001 }, { "epoch": 0.81, "learning_rate": 4.4266291734263834e-07, "loss": 1.0375, "step": 27002 }, { "epoch": 0.81, "learning_rate": 4.4252434742926594e-07, "loss": 1.1792, "step": 27003 }, { "epoch": 0.81, "learning_rate": 4.423857971020712e-07, "loss": 1.2328, "step": 27004 }, { "epoch": 0.81, "learning_rate": 4.4224726636237225e-07, "loss": 1.1528, "step": 27005 }, { "epoch": 0.81, "learning_rate": 4.4210875521148805e-07, "loss": 1.0798, "step": 27006 }, { "epoch": 0.81, "learning_rate": 4.4197026365073754e-07, "loss": 1.1119, "step": 27007 }, { "epoch": 0.81, "learning_rate": 4.418317916814396e-07, "loss": 1.0832, "step": 27008 }, { "epoch": 0.81, "learning_rate": 4.416933393049111e-07, "loss": 1.1408, "step": 27009 }, { "epoch": 0.81, "learning_rate": 4.415549065224709e-07, "loss": 1.2321, "step": 27010 }, { "epoch": 0.81, "learning_rate": 4.414164933354362e-07, "loss": 1.2134, "step": 27011 }, { "epoch": 0.81, "learning_rate": 4.41278099745126e-07, "loss": 1.1138, "step": 27012 }, { "epoch": 0.81, "learning_rate": 4.41139725752856e-07, "loss": 1.1254, "step": 27013 }, { "epoch": 0.81, "learning_rate": 4.4100137135994426e-07, "loss": 1.1276, "step": 27014 }, { "epoch": 0.81, "learning_rate": 4.4086303656770773e-07, "loss": 1.1044, "step": 27015 }, { "epoch": 0.81, "learning_rate": 4.4072472137746347e-07, "loss": 1.1011, "step": 27016 }, { "epoch": 0.81, "learning_rate": 4.4058642579052876e-07, "loss": 1.1229, "step": 27017 }, { "epoch": 0.81, "learning_rate": 4.404481498082186e-07, "loss": 1.1173, "step": 27018 }, { "epoch": 0.81, "learning_rate": 4.403098934318503e-07, "loss": 1.1015, "step": 27019 }, { "epoch": 0.81, "learning_rate": 4.4017165666273984e-07, "loss": 1.0784, "step": 27020 }, { "epoch": 0.81, "learning_rate": 4.400334395022032e-07, "loss": 1.071, "step": 27021 }, { "epoch": 0.81, "learning_rate": 4.398952419515559e-07, "loss": 1.008, "step": 27022 }, { "epoch": 0.81, "learning_rate": 4.3975706401211406e-07, "loss": 1.1263, "step": 27023 }, { "epoch": 0.81, "learning_rate": 4.396189056851924e-07, "loss": 1.1864, "step": 27024 }, { "epoch": 0.81, "learning_rate": 4.3948076697210714e-07, "loss": 1.1687, "step": 27025 }, { "epoch": 0.81, "learning_rate": 4.393426478741722e-07, "loss": 1.1165, "step": 27026 }, { "epoch": 0.81, "learning_rate": 4.3920454839270236e-07, "loss": 1.1138, "step": 27027 }, { "epoch": 0.81, "learning_rate": 4.39066468529013e-07, "loss": 1.0297, "step": 27028 }, { "epoch": 0.81, "learning_rate": 4.3892840828441833e-07, "loss": 1.0535, "step": 27029 }, { "epoch": 0.81, "learning_rate": 4.3879036766023315e-07, "loss": 1.0936, "step": 27030 }, { "epoch": 0.81, "learning_rate": 4.386523466577702e-07, "loss": 1.1849, "step": 27031 }, { "epoch": 0.81, "learning_rate": 4.3851434527834414e-07, "loss": 1.1535, "step": 27032 }, { "epoch": 0.81, "learning_rate": 4.3837636352326877e-07, "loss": 1.1644, "step": 27033 }, { "epoch": 0.81, "learning_rate": 4.3823840139385815e-07, "loss": 1.0534, "step": 27034 }, { "epoch": 0.81, "learning_rate": 4.381004588914245e-07, "loss": 1.1121, "step": 27035 }, { "epoch": 0.81, "learning_rate": 4.3796253601728125e-07, "loss": 1.2239, "step": 27036 }, { "epoch": 0.81, "learning_rate": 4.3782463277274144e-07, "loss": 1.1803, "step": 27037 }, { "epoch": 0.81, "learning_rate": 4.376867491591186e-07, "loss": 1.0832, "step": 27038 }, { "epoch": 0.81, "learning_rate": 4.3754888517772406e-07, "loss": 1.0711, "step": 27039 }, { "epoch": 0.81, "learning_rate": 4.3741104082987096e-07, "loss": 1.0601, "step": 27040 }, { "epoch": 0.81, "learning_rate": 4.3727321611687135e-07, "loss": 1.115, "step": 27041 }, { "epoch": 0.81, "learning_rate": 4.3713541104003775e-07, "loss": 1.058, "step": 27042 }, { "epoch": 0.81, "learning_rate": 4.369976256006811e-07, "loss": 1.1208, "step": 27043 }, { "epoch": 0.81, "learning_rate": 4.368598598001134e-07, "loss": 1.0795, "step": 27044 }, { "epoch": 0.81, "learning_rate": 4.36722113639646e-07, "loss": 1.196, "step": 27045 }, { "epoch": 0.81, "learning_rate": 4.365843871205905e-07, "loss": 1.0977, "step": 27046 }, { "epoch": 0.81, "learning_rate": 4.3644668024425793e-07, "loss": 1.0753, "step": 27047 }, { "epoch": 0.81, "learning_rate": 4.3630899301195907e-07, "loss": 1.0671, "step": 27048 }, { "epoch": 0.81, "learning_rate": 4.3617132542500467e-07, "loss": 1.1186, "step": 27049 }, { "epoch": 0.81, "learning_rate": 4.36033677484706e-07, "loss": 1.0723, "step": 27050 }, { "epoch": 0.81, "learning_rate": 4.358960491923719e-07, "loss": 1.0941, "step": 27051 }, { "epoch": 0.81, "learning_rate": 4.3575844054931345e-07, "loss": 1.0944, "step": 27052 }, { "epoch": 0.81, "learning_rate": 4.356208515568405e-07, "loss": 1.1443, "step": 27053 }, { "epoch": 0.82, "learning_rate": 4.3548328221626273e-07, "loss": 1.0264, "step": 27054 }, { "epoch": 0.82, "learning_rate": 4.353457325288904e-07, "loss": 1.189, "step": 27055 }, { "epoch": 0.82, "learning_rate": 4.3520820249603163e-07, "loss": 1.1103, "step": 27056 }, { "epoch": 0.82, "learning_rate": 4.350706921189965e-07, "loss": 1.0487, "step": 27057 }, { "epoch": 0.82, "learning_rate": 4.3493320139909393e-07, "loss": 1.0269, "step": 27058 }, { "epoch": 0.82, "learning_rate": 4.347957303376324e-07, "loss": 1.204, "step": 27059 }, { "epoch": 0.82, "learning_rate": 4.346582789359219e-07, "loss": 1.0586, "step": 27060 }, { "epoch": 0.82, "learning_rate": 4.345208471952689e-07, "loss": 1.188, "step": 27061 }, { "epoch": 0.82, "learning_rate": 4.343834351169829e-07, "loss": 1.1209, "step": 27062 }, { "epoch": 0.82, "learning_rate": 4.3424604270237174e-07, "loss": 1.0604, "step": 27063 }, { "epoch": 0.82, "learning_rate": 4.341086699527439e-07, "loss": 1.0864, "step": 27064 }, { "epoch": 0.82, "learning_rate": 4.3397131686940597e-07, "loss": 1.1166, "step": 27065 }, { "epoch": 0.82, "learning_rate": 4.338339834536659e-07, "loss": 0.9448, "step": 27066 }, { "epoch": 0.82, "learning_rate": 4.336966697068315e-07, "loss": 1.0906, "step": 27067 }, { "epoch": 0.82, "learning_rate": 4.3355937563021007e-07, "loss": 1.119, "step": 27068 }, { "epoch": 0.82, "learning_rate": 4.3342210122510745e-07, "loss": 1.1813, "step": 27069 }, { "epoch": 0.82, "learning_rate": 4.332848464928313e-07, "loss": 1.0589, "step": 27070 }, { "epoch": 0.82, "learning_rate": 4.3314761143468804e-07, "loss": 1.1098, "step": 27071 }, { "epoch": 0.82, "learning_rate": 4.330103960519841e-07, "loss": 1.1064, "step": 27072 }, { "epoch": 0.82, "learning_rate": 4.328732003460262e-07, "loss": 1.1564, "step": 27073 }, { "epoch": 0.82, "learning_rate": 4.3273602431811945e-07, "loss": 0.9699, "step": 27074 }, { "epoch": 0.82, "learning_rate": 4.3259886796957e-07, "loss": 0.9443, "step": 27075 }, { "epoch": 0.82, "learning_rate": 4.324617313016835e-07, "loss": 1.0331, "step": 27076 }, { "epoch": 0.82, "learning_rate": 4.323246143157656e-07, "loss": 1.0004, "step": 27077 }, { "epoch": 0.82, "learning_rate": 4.3218751701312176e-07, "loss": 1.1273, "step": 27078 }, { "epoch": 0.82, "learning_rate": 4.320504393950567e-07, "loss": 1.1094, "step": 27079 }, { "epoch": 0.82, "learning_rate": 4.319133814628754e-07, "loss": 1.1915, "step": 27080 }, { "epoch": 0.82, "learning_rate": 4.3177634321788344e-07, "loss": 1.1069, "step": 27081 }, { "epoch": 0.82, "learning_rate": 4.31639324661384e-07, "loss": 1.0731, "step": 27082 }, { "epoch": 0.82, "learning_rate": 4.315023257946821e-07, "loss": 1.0909, "step": 27083 }, { "epoch": 0.82, "learning_rate": 4.3136534661908175e-07, "loss": 1.0859, "step": 27084 }, { "epoch": 0.82, "learning_rate": 4.312283871358869e-07, "loss": 1.0506, "step": 27085 }, { "epoch": 0.82, "learning_rate": 4.310914473464023e-07, "loss": 1.0809, "step": 27086 }, { "epoch": 0.82, "learning_rate": 4.3095452725193e-07, "loss": 1.0547, "step": 27087 }, { "epoch": 0.82, "learning_rate": 4.308176268537739e-07, "loss": 1.1318, "step": 27088 }, { "epoch": 0.82, "learning_rate": 4.306807461532375e-07, "loss": 1.1456, "step": 27089 }, { "epoch": 0.82, "learning_rate": 4.305438851516247e-07, "loss": 0.9782, "step": 27090 }, { "epoch": 0.82, "learning_rate": 4.3040704385023666e-07, "loss": 0.9838, "step": 27091 }, { "epoch": 0.82, "learning_rate": 4.3027022225037655e-07, "loss": 1.1391, "step": 27092 }, { "epoch": 0.82, "learning_rate": 4.301334203533475e-07, "loss": 1.1516, "step": 27093 }, { "epoch": 0.82, "learning_rate": 4.2999663816045175e-07, "loss": 1.158, "step": 27094 }, { "epoch": 0.82, "learning_rate": 4.298598756729905e-07, "loss": 1.0255, "step": 27095 }, { "epoch": 0.82, "learning_rate": 4.297231328922663e-07, "loss": 1.0664, "step": 27096 }, { "epoch": 0.82, "learning_rate": 4.295864098195807e-07, "loss": 1.0786, "step": 27097 }, { "epoch": 0.82, "learning_rate": 4.2944970645623557e-07, "loss": 0.9858, "step": 27098 }, { "epoch": 0.82, "learning_rate": 4.293130228035322e-07, "loss": 1.1181, "step": 27099 }, { "epoch": 0.82, "learning_rate": 4.2917635886277146e-07, "loss": 1.2001, "step": 27100 }, { "epoch": 0.82, "learning_rate": 4.29039714635254e-07, "loss": 1.0974, "step": 27101 }, { "epoch": 0.82, "learning_rate": 4.2890309012228124e-07, "loss": 1.0214, "step": 27102 }, { "epoch": 0.82, "learning_rate": 4.2876648532515356e-07, "loss": 1.0841, "step": 27103 }, { "epoch": 0.82, "learning_rate": 4.2862990024517157e-07, "loss": 1.0984, "step": 27104 }, { "epoch": 0.82, "learning_rate": 4.284933348836351e-07, "loss": 1.0012, "step": 27105 }, { "epoch": 0.82, "learning_rate": 4.2835678924184443e-07, "loss": 1.1397, "step": 27106 }, { "epoch": 0.82, "learning_rate": 4.2822026332110024e-07, "loss": 1.019, "step": 27107 }, { "epoch": 0.82, "learning_rate": 4.2808375712270064e-07, "loss": 1.1047, "step": 27108 }, { "epoch": 0.82, "learning_rate": 4.2794727064794565e-07, "loss": 1.0671, "step": 27109 }, { "epoch": 0.82, "learning_rate": 4.278108038981346e-07, "loss": 1.0622, "step": 27110 }, { "epoch": 0.82, "learning_rate": 4.27674356874567e-07, "loss": 1.1036, "step": 27111 }, { "epoch": 0.82, "learning_rate": 4.27537929578542e-07, "loss": 1.228, "step": 27112 }, { "epoch": 0.82, "learning_rate": 4.27401522011357e-07, "loss": 1.1338, "step": 27113 }, { "epoch": 0.82, "learning_rate": 4.272651341743114e-07, "loss": 1.1777, "step": 27114 }, { "epoch": 0.82, "learning_rate": 4.2712876606870344e-07, "loss": 1.1267, "step": 27115 }, { "epoch": 0.82, "learning_rate": 4.2699241769583203e-07, "loss": 0.9857, "step": 27116 }, { "epoch": 0.82, "learning_rate": 4.2685608905699367e-07, "loss": 1.1601, "step": 27117 }, { "epoch": 0.82, "learning_rate": 4.2671978015348697e-07, "loss": 1.1301, "step": 27118 }, { "epoch": 0.82, "learning_rate": 4.2658349098660927e-07, "loss": 1.1014, "step": 27119 }, { "epoch": 0.82, "learning_rate": 4.26447221557659e-07, "loss": 1.1682, "step": 27120 }, { "epoch": 0.82, "learning_rate": 4.263109718679317e-07, "loss": 1.0314, "step": 27121 }, { "epoch": 0.82, "learning_rate": 4.261747419187254e-07, "loss": 1.122, "step": 27122 }, { "epoch": 0.82, "learning_rate": 4.260385317113366e-07, "loss": 1.1727, "step": 27123 }, { "epoch": 0.82, "learning_rate": 4.2590234124706224e-07, "loss": 1.0546, "step": 27124 }, { "epoch": 0.82, "learning_rate": 4.2576617052719925e-07, "loss": 1.0007, "step": 27125 }, { "epoch": 0.82, "learning_rate": 4.2563001955304274e-07, "loss": 1.0249, "step": 27126 }, { "epoch": 0.82, "learning_rate": 4.254938883258894e-07, "loss": 1.1091, "step": 27127 }, { "epoch": 0.82, "learning_rate": 4.2535777684703514e-07, "loss": 1.0764, "step": 27128 }, { "epoch": 0.82, "learning_rate": 4.2522168511777566e-07, "loss": 1.1454, "step": 27129 }, { "epoch": 0.82, "learning_rate": 4.250856131394063e-07, "loss": 1.2022, "step": 27130 }, { "epoch": 0.82, "learning_rate": 4.2494956091322285e-07, "loss": 1.1426, "step": 27131 }, { "epoch": 0.82, "learning_rate": 4.248135284405208e-07, "loss": 1.1206, "step": 27132 }, { "epoch": 0.82, "learning_rate": 4.246775157225938e-07, "loss": 1.1181, "step": 27133 }, { "epoch": 0.82, "learning_rate": 4.2454152276073716e-07, "loss": 1.0668, "step": 27134 }, { "epoch": 0.82, "learning_rate": 4.2440554955624603e-07, "loss": 1.003, "step": 27135 }, { "epoch": 0.82, "learning_rate": 4.24269596110414e-07, "loss": 1.1906, "step": 27136 }, { "epoch": 0.82, "learning_rate": 4.2413366242453595e-07, "loss": 1.1066, "step": 27137 }, { "epoch": 0.82, "learning_rate": 4.2399774849990637e-07, "loss": 1.0156, "step": 27138 }, { "epoch": 0.82, "learning_rate": 4.238618543378176e-07, "loss": 1.126, "step": 27139 }, { "epoch": 0.82, "learning_rate": 4.2372597993956433e-07, "loss": 1.1505, "step": 27140 }, { "epoch": 0.82, "learning_rate": 4.235901253064395e-07, "loss": 0.9897, "step": 27141 }, { "epoch": 0.82, "learning_rate": 4.2345429043973736e-07, "loss": 1.0466, "step": 27142 }, { "epoch": 0.82, "learning_rate": 4.233184753407496e-07, "loss": 1.1919, "step": 27143 }, { "epoch": 0.82, "learning_rate": 4.2318268001076996e-07, "loss": 1.1886, "step": 27144 }, { "epoch": 0.82, "learning_rate": 4.230469044510907e-07, "loss": 1.1035, "step": 27145 }, { "epoch": 0.82, "learning_rate": 4.229111486630055e-07, "loss": 1.1196, "step": 27146 }, { "epoch": 0.82, "learning_rate": 4.227754126478051e-07, "loss": 0.9929, "step": 27147 }, { "epoch": 0.82, "learning_rate": 4.226396964067822e-07, "loss": 0.9839, "step": 27148 }, { "epoch": 0.82, "learning_rate": 4.225039999412289e-07, "loss": 1.111, "step": 27149 }, { "epoch": 0.82, "learning_rate": 4.2236832325243725e-07, "loss": 1.0511, "step": 27150 }, { "epoch": 0.82, "learning_rate": 4.2223266634169894e-07, "loss": 1.1196, "step": 27151 }, { "epoch": 0.82, "learning_rate": 4.220970292103044e-07, "loss": 1.0779, "step": 27152 }, { "epoch": 0.82, "learning_rate": 4.2196141185954525e-07, "loss": 1.0248, "step": 27153 }, { "epoch": 0.82, "learning_rate": 4.218258142907128e-07, "loss": 1.1003, "step": 27154 }, { "epoch": 0.82, "learning_rate": 4.216902365050984e-07, "loss": 1.1252, "step": 27155 }, { "epoch": 0.82, "learning_rate": 4.2155467850399116e-07, "loss": 1.1118, "step": 27156 }, { "epoch": 0.82, "learning_rate": 4.2141914028868246e-07, "loss": 1.0788, "step": 27157 }, { "epoch": 0.82, "learning_rate": 4.212836218604627e-07, "loss": 1.2299, "step": 27158 }, { "epoch": 0.82, "learning_rate": 4.2114812322062133e-07, "loss": 1.1241, "step": 27159 }, { "epoch": 0.82, "learning_rate": 4.21012644370449e-07, "loss": 1.1095, "step": 27160 }, { "epoch": 0.82, "learning_rate": 4.208771853112348e-07, "loss": 1.1295, "step": 27161 }, { "epoch": 0.82, "learning_rate": 4.2074174604426835e-07, "loss": 1.2723, "step": 27162 }, { "epoch": 0.82, "learning_rate": 4.2060632657083934e-07, "loss": 1.0617, "step": 27163 }, { "epoch": 0.82, "learning_rate": 4.204709268922369e-07, "loss": 0.973, "step": 27164 }, { "epoch": 0.82, "learning_rate": 4.2033554700974947e-07, "loss": 1.116, "step": 27165 }, { "epoch": 0.82, "learning_rate": 4.202001869246658e-07, "loss": 1.1108, "step": 27166 }, { "epoch": 0.82, "learning_rate": 4.200648466382748e-07, "loss": 1.1685, "step": 27167 }, { "epoch": 0.82, "learning_rate": 4.199295261518652e-07, "loss": 1.0364, "step": 27168 }, { "epoch": 0.82, "learning_rate": 4.197942254667242e-07, "loss": 1.0461, "step": 27169 }, { "epoch": 0.82, "learning_rate": 4.1965894458414036e-07, "loss": 1.1354, "step": 27170 }, { "epoch": 0.82, "learning_rate": 4.1952368350540117e-07, "loss": 0.9888, "step": 27171 }, { "epoch": 0.82, "learning_rate": 4.1938844223179534e-07, "loss": 1.1194, "step": 27172 }, { "epoch": 0.82, "learning_rate": 4.192532207646091e-07, "loss": 1.0716, "step": 27173 }, { "epoch": 0.82, "learning_rate": 4.1911801910512973e-07, "loss": 0.9416, "step": 27174 }, { "epoch": 0.82, "learning_rate": 4.1898283725464476e-07, "loss": 1.0424, "step": 27175 }, { "epoch": 0.82, "learning_rate": 4.18847675214441e-07, "loss": 1.0499, "step": 27176 }, { "epoch": 0.82, "learning_rate": 4.1871253298580547e-07, "loss": 1.0367, "step": 27177 }, { "epoch": 0.82, "learning_rate": 4.185774105700238e-07, "loss": 1.119, "step": 27178 }, { "epoch": 0.82, "learning_rate": 4.1844230796838247e-07, "loss": 1.1487, "step": 27179 }, { "epoch": 0.82, "learning_rate": 4.183072251821682e-07, "loss": 1.1607, "step": 27180 }, { "epoch": 0.82, "learning_rate": 4.1817216221266694e-07, "loss": 1.0422, "step": 27181 }, { "epoch": 0.82, "learning_rate": 4.1803711906116375e-07, "loss": 1.0858, "step": 27182 }, { "epoch": 0.82, "learning_rate": 4.1790209572894425e-07, "loss": 1.1036, "step": 27183 }, { "epoch": 0.82, "learning_rate": 4.177670922172938e-07, "loss": 1.002, "step": 27184 }, { "epoch": 0.82, "learning_rate": 4.176321085274981e-07, "loss": 1.0524, "step": 27185 }, { "epoch": 0.82, "learning_rate": 4.1749714466084197e-07, "loss": 1.0755, "step": 27186 }, { "epoch": 0.82, "learning_rate": 4.173622006186098e-07, "loss": 1.0737, "step": 27187 }, { "epoch": 0.82, "learning_rate": 4.1722727640208654e-07, "loss": 1.0276, "step": 27188 }, { "epoch": 0.82, "learning_rate": 4.170923720125564e-07, "loss": 1.0167, "step": 27189 }, { "epoch": 0.82, "learning_rate": 4.169574874513044e-07, "loss": 1.1257, "step": 27190 }, { "epoch": 0.82, "learning_rate": 4.168226227196132e-07, "loss": 1.0867, "step": 27191 }, { "epoch": 0.82, "learning_rate": 4.166877778187675e-07, "loss": 1.174, "step": 27192 }, { "epoch": 0.82, "learning_rate": 4.165529527500506e-07, "loss": 0.9932, "step": 27193 }, { "epoch": 0.82, "learning_rate": 4.164181475147469e-07, "loss": 1.1373, "step": 27194 }, { "epoch": 0.82, "learning_rate": 4.162833621141385e-07, "loss": 1.1265, "step": 27195 }, { "epoch": 0.82, "learning_rate": 4.161485965495088e-07, "loss": 1.0965, "step": 27196 }, { "epoch": 0.82, "learning_rate": 4.1601385082214063e-07, "loss": 1.1298, "step": 27197 }, { "epoch": 0.82, "learning_rate": 4.1587912493331775e-07, "loss": 1.1588, "step": 27198 }, { "epoch": 0.82, "learning_rate": 4.1574441888432127e-07, "loss": 1.1644, "step": 27199 }, { "epoch": 0.82, "learning_rate": 4.156097326764338e-07, "loss": 1.1696, "step": 27200 }, { "epoch": 0.82, "learning_rate": 4.1547506631093834e-07, "loss": 1.1514, "step": 27201 }, { "epoch": 0.82, "learning_rate": 4.153404197891159e-07, "loss": 1.1045, "step": 27202 }, { "epoch": 0.82, "learning_rate": 4.152057931122494e-07, "loss": 1.0527, "step": 27203 }, { "epoch": 0.82, "learning_rate": 4.1507118628161896e-07, "loss": 1.0818, "step": 27204 }, { "epoch": 0.82, "learning_rate": 4.149365992985069e-07, "loss": 1.1552, "step": 27205 }, { "epoch": 0.82, "learning_rate": 4.1480203216419405e-07, "loss": 1.1291, "step": 27206 }, { "epoch": 0.82, "learning_rate": 4.146674848799623e-07, "loss": 1.0309, "step": 27207 }, { "epoch": 0.82, "learning_rate": 4.1453295744709107e-07, "loss": 1.064, "step": 27208 }, { "epoch": 0.82, "learning_rate": 4.1439844986686156e-07, "loss": 1.0745, "step": 27209 }, { "epoch": 0.82, "learning_rate": 4.1426396214055445e-07, "loss": 1.1539, "step": 27210 }, { "epoch": 0.82, "learning_rate": 4.1412949426945016e-07, "loss": 1.2448, "step": 27211 }, { "epoch": 0.82, "learning_rate": 4.139950462548281e-07, "loss": 1.0363, "step": 27212 }, { "epoch": 0.82, "learning_rate": 4.138606180979687e-07, "loss": 1.1435, "step": 27213 }, { "epoch": 0.82, "learning_rate": 4.137262098001521e-07, "loss": 1.1573, "step": 27214 }, { "epoch": 0.82, "learning_rate": 4.1359182136265665e-07, "loss": 1.1705, "step": 27215 }, { "epoch": 0.82, "learning_rate": 4.134574527867621e-07, "loss": 1.013, "step": 27216 }, { "epoch": 0.82, "learning_rate": 4.1332310407374786e-07, "loss": 1.1932, "step": 27217 }, { "epoch": 0.82, "learning_rate": 4.1318877522489255e-07, "loss": 1.2822, "step": 27218 }, { "epoch": 0.82, "learning_rate": 4.1305446624147513e-07, "loss": 1.0361, "step": 27219 }, { "epoch": 0.82, "learning_rate": 4.129201771247748e-07, "loss": 1.1974, "step": 27220 }, { "epoch": 0.82, "learning_rate": 4.127859078760685e-07, "loss": 1.1211, "step": 27221 }, { "epoch": 0.82, "learning_rate": 4.12651658496635e-07, "loss": 1.1622, "step": 27222 }, { "epoch": 0.82, "learning_rate": 4.125174289877526e-07, "loss": 1.1458, "step": 27223 }, { "epoch": 0.82, "learning_rate": 4.1238321935069935e-07, "loss": 1.1435, "step": 27224 }, { "epoch": 0.82, "learning_rate": 4.1224902958675177e-07, "loss": 1.1462, "step": 27225 }, { "epoch": 0.82, "learning_rate": 4.12114859697188e-07, "loss": 1.1698, "step": 27226 }, { "epoch": 0.82, "learning_rate": 4.119807096832854e-07, "loss": 1.0814, "step": 27227 }, { "epoch": 0.82, "learning_rate": 4.118465795463211e-07, "loss": 1.042, "step": 27228 }, { "epoch": 0.82, "learning_rate": 4.1171246928757153e-07, "loss": 1.142, "step": 27229 }, { "epoch": 0.82, "learning_rate": 4.1157837890831306e-07, "loss": 1.299, "step": 27230 }, { "epoch": 0.82, "learning_rate": 4.114443084098227e-07, "loss": 1.1469, "step": 27231 }, { "epoch": 0.82, "learning_rate": 4.1131025779337667e-07, "loss": 1.0613, "step": 27232 }, { "epoch": 0.82, "learning_rate": 4.1117622706025176e-07, "loss": 1.1192, "step": 27233 }, { "epoch": 0.82, "learning_rate": 4.110422162117225e-07, "loss": 1.0684, "step": 27234 }, { "epoch": 0.82, "learning_rate": 4.109082252490651e-07, "loss": 1.0757, "step": 27235 }, { "epoch": 0.82, "learning_rate": 4.1077425417355545e-07, "loss": 1.0445, "step": 27236 }, { "epoch": 0.82, "learning_rate": 4.106403029864692e-07, "loss": 1.1371, "step": 27237 }, { "epoch": 0.82, "learning_rate": 4.105063716890806e-07, "loss": 1.1046, "step": 27238 }, { "epoch": 0.82, "learning_rate": 4.1037246028266476e-07, "loss": 1.1334, "step": 27239 }, { "epoch": 0.82, "learning_rate": 4.102385687684968e-07, "loss": 1.0466, "step": 27240 }, { "epoch": 0.82, "learning_rate": 4.101046971478512e-07, "loss": 1.1721, "step": 27241 }, { "epoch": 0.82, "learning_rate": 4.099708454220022e-07, "loss": 1.1763, "step": 27242 }, { "epoch": 0.82, "learning_rate": 4.0983701359222414e-07, "loss": 1.1102, "step": 27243 }, { "epoch": 0.82, "learning_rate": 4.0970320165979127e-07, "loss": 1.1658, "step": 27244 }, { "epoch": 0.82, "learning_rate": 4.0956940962597726e-07, "loss": 1.0859, "step": 27245 }, { "epoch": 0.82, "learning_rate": 4.0943563749205604e-07, "loss": 1.029, "step": 27246 }, { "epoch": 0.82, "learning_rate": 4.093018852593003e-07, "loss": 1.2042, "step": 27247 }, { "epoch": 0.82, "learning_rate": 4.091681529289837e-07, "loss": 1.1036, "step": 27248 }, { "epoch": 0.82, "learning_rate": 4.090344405023791e-07, "loss": 1.1203, "step": 27249 }, { "epoch": 0.82, "learning_rate": 4.0890074798076026e-07, "loss": 1.2432, "step": 27250 }, { "epoch": 0.82, "learning_rate": 4.087670753653986e-07, "loss": 1.1016, "step": 27251 }, { "epoch": 0.82, "learning_rate": 4.0863342265756724e-07, "loss": 0.9697, "step": 27252 }, { "epoch": 0.82, "learning_rate": 4.0849978985853853e-07, "loss": 1.0797, "step": 27253 }, { "epoch": 0.82, "learning_rate": 4.0836617696958516e-07, "loss": 1.0789, "step": 27254 }, { "epoch": 0.82, "learning_rate": 4.0823258399197764e-07, "loss": 1.0188, "step": 27255 }, { "epoch": 0.82, "learning_rate": 4.0809901092698864e-07, "loss": 1.0656, "step": 27256 }, { "epoch": 0.82, "learning_rate": 4.0796545777588933e-07, "loss": 1.115, "step": 27257 }, { "epoch": 0.82, "learning_rate": 4.078319245399515e-07, "loss": 1.1968, "step": 27258 }, { "epoch": 0.82, "learning_rate": 4.0769841122044656e-07, "loss": 1.048, "step": 27259 }, { "epoch": 0.82, "learning_rate": 4.075649178186447e-07, "loss": 1.0458, "step": 27260 }, { "epoch": 0.82, "learning_rate": 4.0743144433581684e-07, "loss": 1.0073, "step": 27261 }, { "epoch": 0.82, "learning_rate": 4.0729799077323384e-07, "loss": 1.1761, "step": 27262 }, { "epoch": 0.82, "learning_rate": 4.0716455713216696e-07, "loss": 1.0452, "step": 27263 }, { "epoch": 0.82, "learning_rate": 4.0703114341388463e-07, "loss": 1.2622, "step": 27264 }, { "epoch": 0.82, "learning_rate": 4.06897749619658e-07, "loss": 1.0404, "step": 27265 }, { "epoch": 0.82, "learning_rate": 4.0676437575075665e-07, "loss": 1.0165, "step": 27266 }, { "epoch": 0.82, "learning_rate": 4.066310218084504e-07, "loss": 1.1597, "step": 27267 }, { "epoch": 0.82, "learning_rate": 4.0649768779400855e-07, "loss": 1.2313, "step": 27268 }, { "epoch": 0.82, "learning_rate": 4.063643737087003e-07, "loss": 1.051, "step": 27269 }, { "epoch": 0.82, "learning_rate": 4.062310795537952e-07, "loss": 1.0306, "step": 27270 }, { "epoch": 0.82, "learning_rate": 4.0609780533056143e-07, "loss": 1.1198, "step": 27271 }, { "epoch": 0.82, "learning_rate": 4.0596455104026907e-07, "loss": 1.1571, "step": 27272 }, { "epoch": 0.82, "learning_rate": 4.0583131668418487e-07, "loss": 1.1229, "step": 27273 }, { "epoch": 0.82, "learning_rate": 4.056981022635778e-07, "loss": 1.1238, "step": 27274 }, { "epoch": 0.82, "learning_rate": 4.055649077797164e-07, "loss": 1.0045, "step": 27275 }, { "epoch": 0.82, "learning_rate": 4.054317332338689e-07, "loss": 1.0676, "step": 27276 }, { "epoch": 0.82, "learning_rate": 4.05298578627302e-07, "loss": 1.1368, "step": 27277 }, { "epoch": 0.82, "learning_rate": 4.051654439612837e-07, "loss": 1.1428, "step": 27278 }, { "epoch": 0.82, "learning_rate": 4.050323292370814e-07, "loss": 1.0925, "step": 27279 }, { "epoch": 0.82, "learning_rate": 4.04899234455963e-07, "loss": 1.2127, "step": 27280 }, { "epoch": 0.82, "learning_rate": 4.047661596191943e-07, "loss": 1.1545, "step": 27281 }, { "epoch": 0.82, "learning_rate": 4.0463310472804274e-07, "loss": 1.0645, "step": 27282 }, { "epoch": 0.82, "learning_rate": 4.0450006978377477e-07, "loss": 1.1379, "step": 27283 }, { "epoch": 0.82, "learning_rate": 4.0436705478765686e-07, "loss": 1.0991, "step": 27284 }, { "epoch": 0.82, "learning_rate": 4.042340597409558e-07, "loss": 1.0224, "step": 27285 }, { "epoch": 0.82, "learning_rate": 4.041010846449367e-07, "loss": 1.1141, "step": 27286 }, { "epoch": 0.82, "learning_rate": 4.03968129500866e-07, "loss": 0.9696, "step": 27287 }, { "epoch": 0.82, "learning_rate": 4.0383519431000885e-07, "loss": 1.0662, "step": 27288 }, { "epoch": 0.82, "learning_rate": 4.0370227907363194e-07, "loss": 1.019, "step": 27289 }, { "epoch": 0.82, "learning_rate": 4.0356938379299907e-07, "loss": 1.0726, "step": 27290 }, { "epoch": 0.82, "learning_rate": 4.0343650846937616e-07, "loss": 1.1193, "step": 27291 }, { "epoch": 0.82, "learning_rate": 4.033036531040277e-07, "loss": 1.2072, "step": 27292 }, { "epoch": 0.82, "learning_rate": 4.031708176982188e-07, "loss": 1.2008, "step": 27293 }, { "epoch": 0.82, "learning_rate": 4.0303800225321377e-07, "loss": 1.0909, "step": 27294 }, { "epoch": 0.82, "learning_rate": 4.029052067702771e-07, "loss": 1.0766, "step": 27295 }, { "epoch": 0.82, "learning_rate": 4.0277243125067255e-07, "loss": 1.0428, "step": 27296 }, { "epoch": 0.82, "learning_rate": 4.0263967569566546e-07, "loss": 1.0815, "step": 27297 }, { "epoch": 0.82, "learning_rate": 4.0250694010651766e-07, "loss": 1.0214, "step": 27298 }, { "epoch": 0.82, "learning_rate": 4.023742244844936e-07, "loss": 1.1971, "step": 27299 }, { "epoch": 0.82, "learning_rate": 4.0224152883085675e-07, "loss": 1.1899, "step": 27300 }, { "epoch": 0.82, "learning_rate": 4.0210885314687034e-07, "loss": 1.073, "step": 27301 }, { "epoch": 0.82, "learning_rate": 4.019761974337977e-07, "loss": 1.0847, "step": 27302 }, { "epoch": 0.82, "learning_rate": 4.0184356169290064e-07, "loss": 1.103, "step": 27303 }, { "epoch": 0.82, "learning_rate": 4.017109459254426e-07, "loss": 1.1384, "step": 27304 }, { "epoch": 0.82, "learning_rate": 4.0157835013268556e-07, "loss": 0.9412, "step": 27305 }, { "epoch": 0.82, "learning_rate": 4.0144577431589253e-07, "loss": 1.0892, "step": 27306 }, { "epoch": 0.82, "learning_rate": 4.0131321847632465e-07, "loss": 1.1617, "step": 27307 }, { "epoch": 0.82, "learning_rate": 4.0118068261524395e-07, "loss": 1.0657, "step": 27308 }, { "epoch": 0.82, "learning_rate": 4.010481667339125e-07, "loss": 1.072, "step": 27309 }, { "epoch": 0.82, "learning_rate": 4.009156708335915e-07, "loss": 1.0613, "step": 27310 }, { "epoch": 0.82, "learning_rate": 4.00783194915543e-07, "loss": 1.1091, "step": 27311 }, { "epoch": 0.82, "learning_rate": 4.0065073898102684e-07, "loss": 1.121, "step": 27312 }, { "epoch": 0.82, "learning_rate": 4.005183030313045e-07, "loss": 1.0141, "step": 27313 }, { "epoch": 0.82, "learning_rate": 4.003858870676369e-07, "loss": 1.1611, "step": 27314 }, { "epoch": 0.82, "learning_rate": 4.00253491091285e-07, "loss": 1.1146, "step": 27315 }, { "epoch": 0.82, "learning_rate": 4.0012111510350783e-07, "loss": 1.0588, "step": 27316 }, { "epoch": 0.82, "learning_rate": 3.999887591055665e-07, "loss": 1.1449, "step": 27317 }, { "epoch": 0.82, "learning_rate": 3.998564230987209e-07, "loss": 1.1291, "step": 27318 }, { "epoch": 0.82, "learning_rate": 3.9972410708423113e-07, "loss": 1.2653, "step": 27319 }, { "epoch": 0.82, "learning_rate": 3.9959181106335563e-07, "loss": 1.0017, "step": 27320 }, { "epoch": 0.82, "learning_rate": 3.9945953503735454e-07, "loss": 1.0864, "step": 27321 }, { "epoch": 0.82, "learning_rate": 3.993272790074873e-07, "loss": 1.0697, "step": 27322 }, { "epoch": 0.82, "learning_rate": 3.991950429750124e-07, "loss": 0.999, "step": 27323 }, { "epoch": 0.82, "learning_rate": 3.9906282694118893e-07, "loss": 1.1578, "step": 27324 }, { "epoch": 0.82, "learning_rate": 3.9893063090727546e-07, "loss": 1.091, "step": 27325 }, { "epoch": 0.82, "learning_rate": 3.987984548745305e-07, "loss": 1.0379, "step": 27326 }, { "epoch": 0.82, "learning_rate": 3.986662988442122e-07, "loss": 1.0959, "step": 27327 }, { "epoch": 0.82, "learning_rate": 3.9853416281757957e-07, "loss": 0.989, "step": 27328 }, { "epoch": 0.82, "learning_rate": 3.984020467958888e-07, "loss": 1.0709, "step": 27329 }, { "epoch": 0.82, "learning_rate": 3.982699507803983e-07, "loss": 1.256, "step": 27330 }, { "epoch": 0.82, "learning_rate": 3.981378747723658e-07, "loss": 1.0571, "step": 27331 }, { "epoch": 0.82, "learning_rate": 3.98005818773049e-07, "loss": 0.9492, "step": 27332 }, { "epoch": 0.82, "learning_rate": 3.9787378278370396e-07, "loss": 1.0472, "step": 27333 }, { "epoch": 0.82, "learning_rate": 3.97741766805588e-07, "loss": 1.0968, "step": 27334 }, { "epoch": 0.82, "learning_rate": 3.976097708399579e-07, "loss": 1.0493, "step": 27335 }, { "epoch": 0.82, "learning_rate": 3.974777948880701e-07, "loss": 1.2698, "step": 27336 }, { "epoch": 0.82, "learning_rate": 3.9734583895118193e-07, "loss": 1.2038, "step": 27337 }, { "epoch": 0.82, "learning_rate": 3.97213903030548e-07, "loss": 1.0269, "step": 27338 }, { "epoch": 0.82, "learning_rate": 3.9708198712742506e-07, "loss": 1.0926, "step": 27339 }, { "epoch": 0.82, "learning_rate": 3.969500912430688e-07, "loss": 1.1036, "step": 27340 }, { "epoch": 0.82, "learning_rate": 3.9681821537873534e-07, "loss": 0.9789, "step": 27341 }, { "epoch": 0.82, "learning_rate": 3.9668635953567874e-07, "loss": 1.1027, "step": 27342 }, { "epoch": 0.82, "learning_rate": 3.9655452371515525e-07, "loss": 1.0975, "step": 27343 }, { "epoch": 0.82, "learning_rate": 3.9642270791841964e-07, "loss": 1.1046, "step": 27344 }, { "epoch": 0.82, "learning_rate": 3.962909121467273e-07, "loss": 0.9952, "step": 27345 }, { "epoch": 0.82, "learning_rate": 3.9615913640133174e-07, "loss": 1.0372, "step": 27346 }, { "epoch": 0.82, "learning_rate": 3.960273806834877e-07, "loss": 1.1703, "step": 27347 }, { "epoch": 0.82, "learning_rate": 3.958956449944501e-07, "loss": 1.1908, "step": 27348 }, { "epoch": 0.82, "learning_rate": 3.957639293354723e-07, "loss": 1.0561, "step": 27349 }, { "epoch": 0.82, "learning_rate": 3.9563223370780863e-07, "loss": 1.0046, "step": 27350 }, { "epoch": 0.82, "learning_rate": 3.955005581127125e-07, "loss": 1.0824, "step": 27351 }, { "epoch": 0.82, "learning_rate": 3.9536890255143736e-07, "loss": 1.1229, "step": 27352 }, { "epoch": 0.82, "learning_rate": 3.952372670252369e-07, "loss": 0.9752, "step": 27353 }, { "epoch": 0.82, "learning_rate": 3.9510565153536436e-07, "loss": 1.0977, "step": 27354 }, { "epoch": 0.82, "learning_rate": 3.949740560830717e-07, "loss": 1.0938, "step": 27355 }, { "epoch": 0.82, "learning_rate": 3.948424806696124e-07, "loss": 1.0573, "step": 27356 }, { "epoch": 0.82, "learning_rate": 3.947109252962386e-07, "loss": 1.1699, "step": 27357 }, { "epoch": 0.82, "learning_rate": 3.9457938996420337e-07, "loss": 1.1321, "step": 27358 }, { "epoch": 0.82, "learning_rate": 3.9444787467475794e-07, "loss": 1.1254, "step": 27359 }, { "epoch": 0.82, "learning_rate": 3.9431637942915464e-07, "loss": 0.9703, "step": 27360 }, { "epoch": 0.82, "learning_rate": 3.9418490422864527e-07, "loss": 1.0964, "step": 27361 }, { "epoch": 0.82, "learning_rate": 3.9405344907448154e-07, "loss": 1.1815, "step": 27362 }, { "epoch": 0.82, "learning_rate": 3.9392201396791505e-07, "loss": 1.132, "step": 27363 }, { "epoch": 0.82, "learning_rate": 3.937905989101962e-07, "loss": 1.1163, "step": 27364 }, { "epoch": 0.82, "learning_rate": 3.936592039025766e-07, "loss": 0.9436, "step": 27365 }, { "epoch": 0.82, "learning_rate": 3.935278289463068e-07, "loss": 1.0494, "step": 27366 }, { "epoch": 0.82, "learning_rate": 3.93396474042638e-07, "loss": 1.1963, "step": 27367 }, { "epoch": 0.82, "learning_rate": 3.9326513919281966e-07, "loss": 1.1931, "step": 27368 }, { "epoch": 0.82, "learning_rate": 3.931338243981028e-07, "loss": 1.1001, "step": 27369 }, { "epoch": 0.82, "learning_rate": 3.93002529659737e-07, "loss": 1.1544, "step": 27370 }, { "epoch": 0.82, "learning_rate": 3.9287125497897314e-07, "loss": 1.0791, "step": 27371 }, { "epoch": 0.82, "learning_rate": 3.927400003570592e-07, "loss": 1.053, "step": 27372 }, { "epoch": 0.82, "learning_rate": 3.92608765795246e-07, "loss": 1.0807, "step": 27373 }, { "epoch": 0.82, "learning_rate": 3.9247755129478207e-07, "loss": 1.1683, "step": 27374 }, { "epoch": 0.82, "learning_rate": 3.9234635685691693e-07, "loss": 1.0304, "step": 27375 }, { "epoch": 0.82, "learning_rate": 3.922151824828993e-07, "loss": 0.9793, "step": 27376 }, { "epoch": 0.82, "learning_rate": 3.92084028173978e-07, "loss": 1.109, "step": 27377 }, { "epoch": 0.82, "learning_rate": 3.919528939314016e-07, "loss": 1.0374, "step": 27378 }, { "epoch": 0.82, "learning_rate": 3.918217797564192e-07, "loss": 1.1514, "step": 27379 }, { "epoch": 0.82, "learning_rate": 3.9169068565027723e-07, "loss": 1.1039, "step": 27380 }, { "epoch": 0.82, "learning_rate": 3.915596116142245e-07, "loss": 1.057, "step": 27381 }, { "epoch": 0.82, "learning_rate": 3.914285576495089e-07, "loss": 1.1159, "step": 27382 }, { "epoch": 0.82, "learning_rate": 3.9129752375737793e-07, "loss": 1.1324, "step": 27383 }, { "epoch": 0.82, "learning_rate": 3.911665099390796e-07, "loss": 1.0893, "step": 27384 }, { "epoch": 0.82, "learning_rate": 3.910355161958598e-07, "loss": 1.0991, "step": 27385 }, { "epoch": 0.83, "learning_rate": 3.909045425289662e-07, "loss": 1.1379, "step": 27386 }, { "epoch": 0.83, "learning_rate": 3.907735889396455e-07, "loss": 1.0778, "step": 27387 }, { "epoch": 0.83, "learning_rate": 3.9064265542914454e-07, "loss": 1.1401, "step": 27388 }, { "epoch": 0.83, "learning_rate": 3.9051174199871006e-07, "loss": 1.0768, "step": 27389 }, { "epoch": 0.83, "learning_rate": 3.903808486495872e-07, "loss": 0.9953, "step": 27390 }, { "epoch": 0.83, "learning_rate": 3.9024997538302275e-07, "loss": 1.1602, "step": 27391 }, { "epoch": 0.83, "learning_rate": 3.901191222002623e-07, "loss": 1.1457, "step": 27392 }, { "epoch": 0.83, "learning_rate": 3.899882891025525e-07, "loss": 1.069, "step": 27393 }, { "epoch": 0.83, "learning_rate": 3.898574760911372e-07, "loss": 1.0951, "step": 27394 }, { "epoch": 0.83, "learning_rate": 3.8972668316726245e-07, "loss": 1.0914, "step": 27395 }, { "epoch": 0.83, "learning_rate": 3.895959103321734e-07, "loss": 1.0143, "step": 27396 }, { "epoch": 0.83, "learning_rate": 3.894651575871153e-07, "loss": 1.1062, "step": 27397 }, { "epoch": 0.83, "learning_rate": 3.8933442493333196e-07, "loss": 1.1695, "step": 27398 }, { "epoch": 0.83, "learning_rate": 3.892037123720685e-07, "loss": 1.1725, "step": 27399 }, { "epoch": 0.83, "learning_rate": 3.890730199045689e-07, "loss": 1.0029, "step": 27400 }, { "epoch": 0.83, "learning_rate": 3.8894234753207807e-07, "loss": 1.0616, "step": 27401 }, { "epoch": 0.83, "learning_rate": 3.8881169525583906e-07, "loss": 1.1318, "step": 27402 }, { "epoch": 0.83, "learning_rate": 3.8868106307709567e-07, "loss": 1.071, "step": 27403 }, { "epoch": 0.83, "learning_rate": 3.885504509970917e-07, "loss": 1.1041, "step": 27404 }, { "epoch": 0.83, "learning_rate": 3.884198590170707e-07, "loss": 1.0677, "step": 27405 }, { "epoch": 0.83, "learning_rate": 3.8828928713827543e-07, "loss": 1.2255, "step": 27406 }, { "epoch": 0.83, "learning_rate": 3.8815873536194927e-07, "loss": 1.0226, "step": 27407 }, { "epoch": 0.83, "learning_rate": 3.8802820368933485e-07, "loss": 1.1488, "step": 27408 }, { "epoch": 0.83, "learning_rate": 3.878976921216748e-07, "loss": 1.0491, "step": 27409 }, { "epoch": 0.83, "learning_rate": 3.8776720066021204e-07, "loss": 1.1945, "step": 27410 }, { "epoch": 0.83, "learning_rate": 3.876367293061878e-07, "loss": 1.0848, "step": 27411 }, { "epoch": 0.83, "learning_rate": 3.8750627806084434e-07, "loss": 1.1913, "step": 27412 }, { "epoch": 0.83, "learning_rate": 3.8737584692542377e-07, "loss": 1.1313, "step": 27413 }, { "epoch": 0.83, "learning_rate": 3.872454359011682e-07, "loss": 1.0964, "step": 27414 }, { "epoch": 0.83, "learning_rate": 3.87115044989318e-07, "loss": 1.0021, "step": 27415 }, { "epoch": 0.83, "learning_rate": 3.8698467419111515e-07, "loss": 1.0329, "step": 27416 }, { "epoch": 0.83, "learning_rate": 3.868543235078004e-07, "loss": 1.1376, "step": 27417 }, { "epoch": 0.83, "learning_rate": 3.8672399294061467e-07, "loss": 1.1931, "step": 27418 }, { "epoch": 0.83, "learning_rate": 3.8659368249079925e-07, "loss": 0.9695, "step": 27419 }, { "epoch": 0.83, "learning_rate": 3.8646339215959366e-07, "loss": 1.0198, "step": 27420 }, { "epoch": 0.83, "learning_rate": 3.8633312194823886e-07, "loss": 1.0307, "step": 27421 }, { "epoch": 0.83, "learning_rate": 3.862028718579744e-07, "loss": 1.0692, "step": 27422 }, { "epoch": 0.83, "learning_rate": 3.8607264189004154e-07, "loss": 1.0655, "step": 27423 }, { "epoch": 0.83, "learning_rate": 3.859424320456781e-07, "loss": 1.0598, "step": 27424 }, { "epoch": 0.83, "learning_rate": 3.858122423261246e-07, "loss": 1.084, "step": 27425 }, { "epoch": 0.83, "learning_rate": 3.856820727326205e-07, "loss": 1.0926, "step": 27426 }, { "epoch": 0.83, "learning_rate": 3.855519232664051e-07, "loss": 1.1, "step": 27427 }, { "epoch": 0.83, "learning_rate": 3.8542179392871663e-07, "loss": 1.0935, "step": 27428 }, { "epoch": 0.83, "learning_rate": 3.852916847207944e-07, "loss": 1.1529, "step": 27429 }, { "epoch": 0.83, "learning_rate": 3.851615956438767e-07, "loss": 1.056, "step": 27430 }, { "epoch": 0.83, "learning_rate": 3.850315266992019e-07, "loss": 1.1932, "step": 27431 }, { "epoch": 0.83, "learning_rate": 3.849014778880086e-07, "loss": 1.069, "step": 27432 }, { "epoch": 0.83, "learning_rate": 3.8477144921153455e-07, "loss": 1.1639, "step": 27433 }, { "epoch": 0.83, "learning_rate": 3.846414406710175e-07, "loss": 0.9882, "step": 27434 }, { "epoch": 0.83, "learning_rate": 3.8451145226769515e-07, "loss": 1.0605, "step": 27435 }, { "epoch": 0.83, "learning_rate": 3.843814840028054e-07, "loss": 1.0812, "step": 27436 }, { "epoch": 0.83, "learning_rate": 3.8425153587758445e-07, "loss": 1.0087, "step": 27437 }, { "epoch": 0.83, "learning_rate": 3.8412160789327023e-07, "loss": 1.0624, "step": 27438 }, { "epoch": 0.83, "learning_rate": 3.8399170005109897e-07, "loss": 0.9762, "step": 27439 }, { "epoch": 0.83, "learning_rate": 3.8386181235230827e-07, "loss": 1.0531, "step": 27440 }, { "epoch": 0.83, "learning_rate": 3.837319447981333e-07, "loss": 0.9894, "step": 27441 }, { "epoch": 0.83, "learning_rate": 3.836020973898111e-07, "loss": 1.1172, "step": 27442 }, { "epoch": 0.83, "learning_rate": 3.834722701285776e-07, "loss": 1.0142, "step": 27443 }, { "epoch": 0.83, "learning_rate": 3.8334246301566845e-07, "loss": 1.0043, "step": 27444 }, { "epoch": 0.83, "learning_rate": 3.8321267605232056e-07, "loss": 1.0606, "step": 27445 }, { "epoch": 0.83, "learning_rate": 3.830829092397678e-07, "loss": 1.0513, "step": 27446 }, { "epoch": 0.83, "learning_rate": 3.8295316257924624e-07, "loss": 1.1812, "step": 27447 }, { "epoch": 0.83, "learning_rate": 3.82823436071991e-07, "loss": 1.1742, "step": 27448 }, { "epoch": 0.83, "learning_rate": 3.826937297192376e-07, "loss": 1.1572, "step": 27449 }, { "epoch": 0.83, "learning_rate": 3.8256404352221943e-07, "loss": 1.0312, "step": 27450 }, { "epoch": 0.83, "learning_rate": 3.8243437748217204e-07, "loss": 1.0516, "step": 27451 }, { "epoch": 0.83, "learning_rate": 3.8230473160032924e-07, "loss": 1.0876, "step": 27452 }, { "epoch": 0.83, "learning_rate": 3.8217510587792607e-07, "loss": 1.0442, "step": 27453 }, { "epoch": 0.83, "learning_rate": 3.820455003161955e-07, "loss": 1.121, "step": 27454 }, { "epoch": 0.83, "learning_rate": 3.819159149163718e-07, "loss": 1.1812, "step": 27455 }, { "epoch": 0.83, "learning_rate": 3.8178634967968806e-07, "loss": 1.2131, "step": 27456 }, { "epoch": 0.83, "learning_rate": 3.8165680460737847e-07, "loss": 1.1483, "step": 27457 }, { "epoch": 0.83, "learning_rate": 3.815272797006758e-07, "loss": 1.0958, "step": 27458 }, { "epoch": 0.83, "learning_rate": 3.81397774960813e-07, "loss": 1.0175, "step": 27459 }, { "epoch": 0.83, "learning_rate": 3.812682903890233e-07, "loss": 1.1742, "step": 27460 }, { "epoch": 0.83, "learning_rate": 3.811388259865395e-07, "loss": 1.1319, "step": 27461 }, { "epoch": 0.83, "learning_rate": 3.810093817545929e-07, "loss": 1.1051, "step": 27462 }, { "epoch": 0.83, "learning_rate": 3.808799576944167e-07, "loss": 0.9418, "step": 27463 }, { "epoch": 0.83, "learning_rate": 3.807505538072426e-07, "loss": 1.1407, "step": 27464 }, { "epoch": 0.83, "learning_rate": 3.8062117009430244e-07, "loss": 1.1158, "step": 27465 }, { "epoch": 0.83, "learning_rate": 3.804918065568286e-07, "loss": 1.1055, "step": 27466 }, { "epoch": 0.83, "learning_rate": 3.803624631960515e-07, "loss": 1.0046, "step": 27467 }, { "epoch": 0.83, "learning_rate": 3.8023314001320283e-07, "loss": 1.0786, "step": 27468 }, { "epoch": 0.83, "learning_rate": 3.8010383700951363e-07, "loss": 0.9332, "step": 27469 }, { "epoch": 0.83, "learning_rate": 3.7997455418621515e-07, "loss": 1.0818, "step": 27470 }, { "epoch": 0.83, "learning_rate": 3.798452915445383e-07, "loss": 0.9999, "step": 27471 }, { "epoch": 0.83, "learning_rate": 3.7971604908571267e-07, "loss": 1.1689, "step": 27472 }, { "epoch": 0.83, "learning_rate": 3.7958682681096925e-07, "loss": 1.0395, "step": 27473 }, { "epoch": 0.83, "learning_rate": 3.7945762472153786e-07, "loss": 1.1279, "step": 27474 }, { "epoch": 0.83, "learning_rate": 3.7932844281864915e-07, "loss": 1.0469, "step": 27475 }, { "epoch": 0.83, "learning_rate": 3.7919928110353167e-07, "loss": 1.1664, "step": 27476 }, { "epoch": 0.83, "learning_rate": 3.7907013957741574e-07, "loss": 1.1243, "step": 27477 }, { "epoch": 0.83, "learning_rate": 3.789410182415304e-07, "loss": 1.0619, "step": 27478 }, { "epoch": 0.83, "learning_rate": 3.7881191709710577e-07, "loss": 1.0303, "step": 27479 }, { "epoch": 0.83, "learning_rate": 3.7868283614536956e-07, "loss": 1.1453, "step": 27480 }, { "epoch": 0.83, "learning_rate": 3.7855377538755124e-07, "loss": 1.2092, "step": 27481 }, { "epoch": 0.83, "learning_rate": 3.78424734824879e-07, "loss": 1.03, "step": 27482 }, { "epoch": 0.83, "learning_rate": 3.7829571445858137e-07, "loss": 1.1383, "step": 27483 }, { "epoch": 0.83, "learning_rate": 3.781667142898876e-07, "loss": 1.087, "step": 27484 }, { "epoch": 0.83, "learning_rate": 3.780377343200239e-07, "loss": 1.1016, "step": 27485 }, { "epoch": 0.83, "learning_rate": 3.779087745502194e-07, "loss": 1.1528, "step": 27486 }, { "epoch": 0.83, "learning_rate": 3.7777983498170104e-07, "loss": 1.1555, "step": 27487 }, { "epoch": 0.83, "learning_rate": 3.7765091561569653e-07, "loss": 1.1382, "step": 27488 }, { "epoch": 0.83, "learning_rate": 3.775220164534332e-07, "loss": 1.1442, "step": 27489 }, { "epoch": 0.83, "learning_rate": 3.7739313749613813e-07, "loss": 1.0607, "step": 27490 }, { "epoch": 0.83, "learning_rate": 3.7726427874503815e-07, "loss": 1.0793, "step": 27491 }, { "epoch": 0.83, "learning_rate": 3.7713544020136025e-07, "loss": 1.0649, "step": 27492 }, { "epoch": 0.83, "learning_rate": 3.7700662186633014e-07, "loss": 1.129, "step": 27493 }, { "epoch": 0.83, "learning_rate": 3.7687782374117465e-07, "loss": 1.0748, "step": 27494 }, { "epoch": 0.83, "learning_rate": 3.767490458271195e-07, "loss": 1.2014, "step": 27495 }, { "epoch": 0.83, "learning_rate": 3.766202881253908e-07, "loss": 0.9747, "step": 27496 }, { "epoch": 0.83, "learning_rate": 3.764915506372152e-07, "loss": 1.0609, "step": 27497 }, { "epoch": 0.83, "learning_rate": 3.763628333638164e-07, "loss": 1.114, "step": 27498 }, { "epoch": 0.83, "learning_rate": 3.7623413630642094e-07, "loss": 1.0335, "step": 27499 }, { "epoch": 0.83, "learning_rate": 3.761054594662533e-07, "loss": 1.0054, "step": 27500 }, { "epoch": 0.83, "learning_rate": 3.7597680284453987e-07, "loss": 1.1264, "step": 27501 }, { "epoch": 0.83, "learning_rate": 3.7584816644250344e-07, "loss": 1.1147, "step": 27502 }, { "epoch": 0.83, "learning_rate": 3.757195502613692e-07, "loss": 0.9855, "step": 27503 }, { "epoch": 0.83, "learning_rate": 3.7559095430236224e-07, "loss": 1.1613, "step": 27504 }, { "epoch": 0.83, "learning_rate": 3.754623785667064e-07, "loss": 1.1788, "step": 27505 }, { "epoch": 0.83, "learning_rate": 3.7533382305562525e-07, "loss": 1.1071, "step": 27506 }, { "epoch": 0.83, "learning_rate": 3.7520528777034273e-07, "loss": 1.1696, "step": 27507 }, { "epoch": 0.83, "learning_rate": 3.750767727120824e-07, "loss": 1.111, "step": 27508 }, { "epoch": 0.83, "learning_rate": 3.7494827788206787e-07, "loss": 1.0086, "step": 27509 }, { "epoch": 0.83, "learning_rate": 3.748198032815228e-07, "loss": 1.1404, "step": 27510 }, { "epoch": 0.83, "learning_rate": 3.7469134891166934e-07, "loss": 1.1038, "step": 27511 }, { "epoch": 0.83, "learning_rate": 3.7456291477373037e-07, "loss": 1.2053, "step": 27512 }, { "epoch": 0.83, "learning_rate": 3.7443450086892903e-07, "loss": 1.028, "step": 27513 }, { "epoch": 0.83, "learning_rate": 3.7430610719848744e-07, "loss": 1.0024, "step": 27514 }, { "epoch": 0.83, "learning_rate": 3.741777337636279e-07, "loss": 1.0785, "step": 27515 }, { "epoch": 0.83, "learning_rate": 3.7404938056557233e-07, "loss": 1.0422, "step": 27516 }, { "epoch": 0.83, "learning_rate": 3.73921047605543e-07, "loss": 1.1804, "step": 27517 }, { "epoch": 0.83, "learning_rate": 3.73792734884762e-07, "loss": 1.0828, "step": 27518 }, { "epoch": 0.83, "learning_rate": 3.7366444240444944e-07, "loss": 1.1715, "step": 27519 }, { "epoch": 0.83, "learning_rate": 3.7353617016582716e-07, "loss": 1.0444, "step": 27520 }, { "epoch": 0.83, "learning_rate": 3.734079181701167e-07, "loss": 1.0839, "step": 27521 }, { "epoch": 0.83, "learning_rate": 3.732796864185384e-07, "loss": 1.078, "step": 27522 }, { "epoch": 0.83, "learning_rate": 3.731514749123141e-07, "loss": 1.1244, "step": 27523 }, { "epoch": 0.83, "learning_rate": 3.730232836526626e-07, "loss": 1.1219, "step": 27524 }, { "epoch": 0.83, "learning_rate": 3.7289511264080506e-07, "loss": 1.0381, "step": 27525 }, { "epoch": 0.83, "learning_rate": 3.727669618779617e-07, "loss": 1.2112, "step": 27526 }, { "epoch": 0.83, "learning_rate": 3.726388313653528e-07, "loss": 1.1651, "step": 27527 }, { "epoch": 0.83, "learning_rate": 3.725107211041973e-07, "loss": 1.0153, "step": 27528 }, { "epoch": 0.83, "learning_rate": 3.723826310957149e-07, "loss": 1.0403, "step": 27529 }, { "epoch": 0.83, "learning_rate": 3.722545613411252e-07, "loss": 1.1567, "step": 27530 }, { "epoch": 0.83, "learning_rate": 3.7212651184164813e-07, "loss": 1.1127, "step": 27531 }, { "epoch": 0.83, "learning_rate": 3.71998482598501e-07, "loss": 1.1257, "step": 27532 }, { "epoch": 0.83, "learning_rate": 3.7187047361290365e-07, "loss": 1.1371, "step": 27533 }, { "epoch": 0.83, "learning_rate": 3.71742484886074e-07, "loss": 0.9801, "step": 27534 }, { "epoch": 0.83, "learning_rate": 3.716145164192314e-07, "loss": 1.1563, "step": 27535 }, { "epoch": 0.83, "learning_rate": 3.7148656821359375e-07, "loss": 1.2405, "step": 27536 }, { "epoch": 0.83, "learning_rate": 3.7135864027037837e-07, "loss": 1.1964, "step": 27537 }, { "epoch": 0.83, "learning_rate": 3.7123073259080376e-07, "loss": 1.0419, "step": 27538 }, { "epoch": 0.83, "learning_rate": 3.71102845176087e-07, "loss": 1.0913, "step": 27539 }, { "epoch": 0.83, "learning_rate": 3.7097497802744604e-07, "loss": 1.0526, "step": 27540 }, { "epoch": 0.83, "learning_rate": 3.7084713114609787e-07, "loss": 1.1398, "step": 27541 }, { "epoch": 0.83, "learning_rate": 3.7071930453325964e-07, "loss": 1.076, "step": 27542 }, { "epoch": 0.83, "learning_rate": 3.7059149819014817e-07, "loss": 1.0639, "step": 27543 }, { "epoch": 0.83, "learning_rate": 3.704637121179805e-07, "loss": 1.0084, "step": 27544 }, { "epoch": 0.83, "learning_rate": 3.7033594631797233e-07, "loss": 1.0365, "step": 27545 }, { "epoch": 0.83, "learning_rate": 3.702082007913399e-07, "loss": 1.0719, "step": 27546 }, { "epoch": 0.83, "learning_rate": 3.700804755393e-07, "loss": 1.2042, "step": 27547 }, { "epoch": 0.83, "learning_rate": 3.699527705630679e-07, "loss": 1.1328, "step": 27548 }, { "epoch": 0.83, "learning_rate": 3.6982508586386024e-07, "loss": 1.103, "step": 27549 }, { "epoch": 0.83, "learning_rate": 3.696974214428914e-07, "loss": 1.0133, "step": 27550 }, { "epoch": 0.83, "learning_rate": 3.6956977730137705e-07, "loss": 1.0815, "step": 27551 }, { "epoch": 0.83, "learning_rate": 3.694421534405321e-07, "loss": 1.0174, "step": 27552 }, { "epoch": 0.83, "learning_rate": 3.6931454986157274e-07, "loss": 1.1066, "step": 27553 }, { "epoch": 0.83, "learning_rate": 3.691869665657119e-07, "loss": 1.1122, "step": 27554 }, { "epoch": 0.83, "learning_rate": 3.6905940355416474e-07, "loss": 1.1871, "step": 27555 }, { "epoch": 0.83, "learning_rate": 3.6893186082814616e-07, "loss": 1.1128, "step": 27556 }, { "epoch": 0.83, "learning_rate": 3.688043383888701e-07, "loss": 0.9984, "step": 27557 }, { "epoch": 0.83, "learning_rate": 3.686768362375498e-07, "loss": 1.0746, "step": 27558 }, { "epoch": 0.83, "learning_rate": 3.6854935437539985e-07, "loss": 1.0496, "step": 27559 }, { "epoch": 0.83, "learning_rate": 3.6842189280363314e-07, "loss": 1.1315, "step": 27560 }, { "epoch": 0.83, "learning_rate": 3.6829445152346347e-07, "loss": 1.1049, "step": 27561 }, { "epoch": 0.83, "learning_rate": 3.6816703053610485e-07, "loss": 1.0498, "step": 27562 }, { "epoch": 0.83, "learning_rate": 3.6803962984276854e-07, "loss": 1.0449, "step": 27563 }, { "epoch": 0.83, "learning_rate": 3.6791224944466823e-07, "loss": 1.0923, "step": 27564 }, { "epoch": 0.83, "learning_rate": 3.677848893430164e-07, "loss": 1.054, "step": 27565 }, { "epoch": 0.83, "learning_rate": 3.676575495390261e-07, "loss": 1.0634, "step": 27566 }, { "epoch": 0.83, "learning_rate": 3.675302300339084e-07, "loss": 1.1696, "step": 27567 }, { "epoch": 0.83, "learning_rate": 3.674029308288757e-07, "loss": 1.1508, "step": 27568 }, { "epoch": 0.83, "learning_rate": 3.6727565192514023e-07, "loss": 1.1071, "step": 27569 }, { "epoch": 0.83, "learning_rate": 3.671483933239134e-07, "loss": 1.0142, "step": 27570 }, { "epoch": 0.83, "learning_rate": 3.670211550264066e-07, "loss": 1.1508, "step": 27571 }, { "epoch": 0.83, "learning_rate": 3.668939370338312e-07, "loss": 1.182, "step": 27572 }, { "epoch": 0.83, "learning_rate": 3.667667393473981e-07, "loss": 1.269, "step": 27573 }, { "epoch": 0.83, "learning_rate": 3.66639561968318e-07, "loss": 1.2289, "step": 27574 }, { "epoch": 0.83, "learning_rate": 3.665124048978028e-07, "loss": 1.1172, "step": 27575 }, { "epoch": 0.83, "learning_rate": 3.663852681370611e-07, "loss": 1.0842, "step": 27576 }, { "epoch": 0.83, "learning_rate": 3.6625815168730425e-07, "loss": 1.114, "step": 27577 }, { "epoch": 0.83, "learning_rate": 3.6613105554974214e-07, "loss": 1.085, "step": 27578 }, { "epoch": 0.83, "learning_rate": 3.6600397972558515e-07, "loss": 1.0635, "step": 27579 }, { "epoch": 0.83, "learning_rate": 3.6587692421604206e-07, "loss": 1.0394, "step": 27580 }, { "epoch": 0.83, "learning_rate": 3.657498890223227e-07, "loss": 1.1406, "step": 27581 }, { "epoch": 0.83, "learning_rate": 3.6562287414563663e-07, "loss": 1.0965, "step": 27582 }, { "epoch": 0.83, "learning_rate": 3.654958795871932e-07, "loss": 1.0507, "step": 27583 }, { "epoch": 0.83, "learning_rate": 3.653689053482007e-07, "loss": 1.1315, "step": 27584 }, { "epoch": 0.83, "learning_rate": 3.65241951429868e-07, "loss": 1.068, "step": 27585 }, { "epoch": 0.83, "learning_rate": 3.651150178334037e-07, "loss": 1.035, "step": 27586 }, { "epoch": 0.83, "learning_rate": 3.6498810456001704e-07, "loss": 1.1601, "step": 27587 }, { "epoch": 0.83, "learning_rate": 3.6486121161091457e-07, "loss": 1.157, "step": 27588 }, { "epoch": 0.83, "learning_rate": 3.6473433898730507e-07, "loss": 1.0951, "step": 27589 }, { "epoch": 0.83, "learning_rate": 3.6460748669039646e-07, "loss": 1.0934, "step": 27590 }, { "epoch": 0.83, "learning_rate": 3.644806547213958e-07, "loss": 1.1466, "step": 27591 }, { "epoch": 0.83, "learning_rate": 3.643538430815116e-07, "loss": 1.1773, "step": 27592 }, { "epoch": 0.83, "learning_rate": 3.6422705177194985e-07, "loss": 1.1052, "step": 27593 }, { "epoch": 0.83, "learning_rate": 3.6410028079391784e-07, "loss": 1.1328, "step": 27594 }, { "epoch": 0.83, "learning_rate": 3.639735301486222e-07, "loss": 1.1397, "step": 27595 }, { "epoch": 0.83, "learning_rate": 3.638467998372702e-07, "loss": 0.9839, "step": 27596 }, { "epoch": 0.83, "learning_rate": 3.637200898610677e-07, "loss": 1.0938, "step": 27597 }, { "epoch": 0.83, "learning_rate": 3.63593400221221e-07, "loss": 1.1569, "step": 27598 }, { "epoch": 0.83, "learning_rate": 3.6346673091893605e-07, "loss": 1.0601, "step": 27599 }, { "epoch": 0.83, "learning_rate": 3.6334008195541976e-07, "loss": 1.0954, "step": 27600 }, { "epoch": 0.83, "learning_rate": 3.6321345333187594e-07, "loss": 0.9999, "step": 27601 }, { "epoch": 0.83, "learning_rate": 3.630868450495112e-07, "loss": 1.142, "step": 27602 }, { "epoch": 0.83, "learning_rate": 3.629602571095303e-07, "loss": 1.0048, "step": 27603 }, { "epoch": 0.83, "learning_rate": 3.6283368951313877e-07, "loss": 1.2035, "step": 27604 }, { "epoch": 0.83, "learning_rate": 3.6270714226154165e-07, "loss": 1.0302, "step": 27605 }, { "epoch": 0.83, "learning_rate": 3.6258061535594274e-07, "loss": 1.0896, "step": 27606 }, { "epoch": 0.83, "learning_rate": 3.624541087975467e-07, "loss": 1.0491, "step": 27607 }, { "epoch": 0.83, "learning_rate": 3.6232762258755827e-07, "loss": 1.1362, "step": 27608 }, { "epoch": 0.83, "learning_rate": 3.6220115672718187e-07, "loss": 1.0273, "step": 27609 }, { "epoch": 0.83, "learning_rate": 3.6207471121762013e-07, "loss": 1.0781, "step": 27610 }, { "epoch": 0.83, "learning_rate": 3.6194828606007757e-07, "loss": 1.1224, "step": 27611 }, { "epoch": 0.83, "learning_rate": 3.618218812557578e-07, "loss": 1.1182, "step": 27612 }, { "epoch": 0.83, "learning_rate": 3.6169549680586416e-07, "loss": 1.1451, "step": 27613 }, { "epoch": 0.83, "learning_rate": 3.615691327115994e-07, "loss": 1.156, "step": 27614 }, { "epoch": 0.83, "learning_rate": 3.614427889741662e-07, "loss": 1.0848, "step": 27615 }, { "epoch": 0.83, "learning_rate": 3.613164655947679e-07, "loss": 1.0098, "step": 27616 }, { "epoch": 0.83, "learning_rate": 3.611901625746067e-07, "loss": 1.1785, "step": 27617 }, { "epoch": 0.83, "learning_rate": 3.6106387991488576e-07, "loss": 1.127, "step": 27618 }, { "epoch": 0.83, "learning_rate": 3.6093761761680583e-07, "loss": 1.0461, "step": 27619 }, { "epoch": 0.83, "learning_rate": 3.608113756815698e-07, "loss": 1.0198, "step": 27620 }, { "epoch": 0.83, "learning_rate": 3.6068515411037896e-07, "loss": 1.0352, "step": 27621 }, { "epoch": 0.83, "learning_rate": 3.6055895290443537e-07, "loss": 1.0859, "step": 27622 }, { "epoch": 0.83, "learning_rate": 3.6043277206494006e-07, "loss": 1.11, "step": 27623 }, { "epoch": 0.83, "learning_rate": 3.6030661159309423e-07, "loss": 1.0654, "step": 27624 }, { "epoch": 0.83, "learning_rate": 3.601804714900989e-07, "loss": 1.2301, "step": 27625 }, { "epoch": 0.83, "learning_rate": 3.600543517571556e-07, "loss": 1.1696, "step": 27626 }, { "epoch": 0.83, "learning_rate": 3.599282523954636e-07, "loss": 1.0473, "step": 27627 }, { "epoch": 0.83, "learning_rate": 3.59802173406224e-07, "loss": 1.1361, "step": 27628 }, { "epoch": 0.83, "learning_rate": 3.596761147906369e-07, "loss": 1.1396, "step": 27629 }, { "epoch": 0.83, "learning_rate": 3.5955007654990244e-07, "loss": 1.1722, "step": 27630 }, { "epoch": 0.83, "learning_rate": 3.594240586852207e-07, "loss": 1.0685, "step": 27631 }, { "epoch": 0.83, "learning_rate": 3.592980611977906e-07, "loss": 1.2556, "step": 27632 }, { "epoch": 0.83, "learning_rate": 3.5917208408881214e-07, "loss": 1.1249, "step": 27633 }, { "epoch": 0.83, "learning_rate": 3.590461273594842e-07, "loss": 1.0536, "step": 27634 }, { "epoch": 0.83, "learning_rate": 3.5892019101100655e-07, "loss": 1.1321, "step": 27635 }, { "epoch": 0.83, "learning_rate": 3.587942750445769e-07, "loss": 1.1521, "step": 27636 }, { "epoch": 0.83, "learning_rate": 3.586683794613946e-07, "loss": 1.1011, "step": 27637 }, { "epoch": 0.83, "learning_rate": 3.585425042626581e-07, "loss": 1.0349, "step": 27638 }, { "epoch": 0.83, "learning_rate": 3.584166494495661e-07, "loss": 1.0675, "step": 27639 }, { "epoch": 0.83, "learning_rate": 3.5829081502331554e-07, "loss": 1.1006, "step": 27640 }, { "epoch": 0.83, "learning_rate": 3.5816500098510483e-07, "loss": 1.0369, "step": 27641 }, { "epoch": 0.83, "learning_rate": 3.580392073361322e-07, "loss": 1.0822, "step": 27642 }, { "epoch": 0.83, "learning_rate": 3.5791343407759417e-07, "loss": 1.2359, "step": 27643 }, { "epoch": 0.83, "learning_rate": 3.5778768121068953e-07, "loss": 1.1511, "step": 27644 }, { "epoch": 0.83, "learning_rate": 3.576619487366137e-07, "loss": 1.1182, "step": 27645 }, { "epoch": 0.83, "learning_rate": 3.575362366565643e-07, "loss": 1.1125, "step": 27646 }, { "epoch": 0.83, "learning_rate": 3.5741054497173826e-07, "loss": 1.0973, "step": 27647 }, { "epoch": 0.83, "learning_rate": 3.572848736833326e-07, "loss": 1.1161, "step": 27648 }, { "epoch": 0.83, "learning_rate": 3.571592227925422e-07, "loss": 1.1511, "step": 27649 }, { "epoch": 0.83, "learning_rate": 3.5703359230056384e-07, "loss": 1.0878, "step": 27650 }, { "epoch": 0.83, "learning_rate": 3.5690798220859385e-07, "loss": 1.1016, "step": 27651 }, { "epoch": 0.83, "learning_rate": 3.567823925178274e-07, "loss": 1.1032, "step": 27652 }, { "epoch": 0.83, "learning_rate": 3.566568232294607e-07, "loss": 0.9921, "step": 27653 }, { "epoch": 0.83, "learning_rate": 3.565312743446886e-07, "loss": 1.0814, "step": 27654 }, { "epoch": 0.83, "learning_rate": 3.5640574586470663e-07, "loss": 1.2007, "step": 27655 }, { "epoch": 0.83, "learning_rate": 3.562802377907093e-07, "loss": 1.032, "step": 27656 }, { "epoch": 0.83, "learning_rate": 3.561547501238924e-07, "loss": 1.0862, "step": 27657 }, { "epoch": 0.83, "learning_rate": 3.5602928286544907e-07, "loss": 1.1989, "step": 27658 }, { "epoch": 0.83, "learning_rate": 3.559038360165745e-07, "loss": 1.108, "step": 27659 }, { "epoch": 0.83, "learning_rate": 3.5577840957846275e-07, "loss": 1.1422, "step": 27660 }, { "epoch": 0.83, "learning_rate": 3.5565300355230844e-07, "loss": 1.1675, "step": 27661 }, { "epoch": 0.83, "learning_rate": 3.555276179393041e-07, "loss": 1.2226, "step": 27662 }, { "epoch": 0.83, "learning_rate": 3.554022527406442e-07, "loss": 1.1162, "step": 27663 }, { "epoch": 0.83, "learning_rate": 3.552769079575219e-07, "loss": 1.0687, "step": 27664 }, { "epoch": 0.83, "learning_rate": 3.551515835911309e-07, "loss": 1.1178, "step": 27665 }, { "epoch": 0.83, "learning_rate": 3.5502627964266346e-07, "loss": 1.1406, "step": 27666 }, { "epoch": 0.83, "learning_rate": 3.549009961133129e-07, "loss": 1.0988, "step": 27667 }, { "epoch": 0.83, "learning_rate": 3.547757330042714e-07, "loss": 1.2415, "step": 27668 }, { "epoch": 0.83, "learning_rate": 3.546504903167322e-07, "loss": 1.0657, "step": 27669 }, { "epoch": 0.83, "learning_rate": 3.5452526805188736e-07, "loss": 1.0689, "step": 27670 }, { "epoch": 0.83, "learning_rate": 3.5440006621092817e-07, "loss": 1.0928, "step": 27671 }, { "epoch": 0.83, "learning_rate": 3.54274884795047e-07, "loss": 1.0305, "step": 27672 }, { "epoch": 0.83, "learning_rate": 3.5414972380543535e-07, "loss": 1.0945, "step": 27673 }, { "epoch": 0.83, "learning_rate": 3.5402458324328564e-07, "loss": 1.1926, "step": 27674 }, { "epoch": 0.83, "learning_rate": 3.538994631097875e-07, "loss": 1.2086, "step": 27675 }, { "epoch": 0.83, "learning_rate": 3.537743634061333e-07, "loss": 1.1443, "step": 27676 }, { "epoch": 0.83, "learning_rate": 3.536492841335132e-07, "loss": 1.0367, "step": 27677 }, { "epoch": 0.83, "learning_rate": 3.5352422529311817e-07, "loss": 0.9786, "step": 27678 }, { "epoch": 0.83, "learning_rate": 3.533991868861389e-07, "loss": 1.072, "step": 27679 }, { "epoch": 0.83, "learning_rate": 3.532741689137656e-07, "loss": 1.105, "step": 27680 }, { "epoch": 0.83, "learning_rate": 3.5314917137718813e-07, "loss": 1.1746, "step": 27681 }, { "epoch": 0.83, "learning_rate": 3.5302419427759667e-07, "loss": 1.0423, "step": 27682 }, { "epoch": 0.83, "learning_rate": 3.5289923761618135e-07, "loss": 1.0715, "step": 27683 }, { "epoch": 0.83, "learning_rate": 3.5277430139413066e-07, "loss": 1.0169, "step": 27684 }, { "epoch": 0.83, "learning_rate": 3.526493856126345e-07, "loss": 1.1634, "step": 27685 }, { "epoch": 0.83, "learning_rate": 3.5252449027288195e-07, "loss": 1.0442, "step": 27686 }, { "epoch": 0.83, "learning_rate": 3.523996153760628e-07, "loss": 1.0397, "step": 27687 }, { "epoch": 0.83, "learning_rate": 3.5227476092336425e-07, "loss": 1.1497, "step": 27688 }, { "epoch": 0.83, "learning_rate": 3.521499269159756e-07, "loss": 1.061, "step": 27689 }, { "epoch": 0.83, "learning_rate": 3.5202511335508507e-07, "loss": 1.1376, "step": 27690 }, { "epoch": 0.83, "learning_rate": 3.5190032024188166e-07, "loss": 1.0604, "step": 27691 }, { "epoch": 0.83, "learning_rate": 3.517755475775522e-07, "loss": 1.0908, "step": 27692 }, { "epoch": 0.83, "learning_rate": 3.5165079536328473e-07, "loss": 0.986, "step": 27693 }, { "epoch": 0.83, "learning_rate": 3.515260636002671e-07, "loss": 1.1179, "step": 27694 }, { "epoch": 0.83, "learning_rate": 3.514013522896864e-07, "loss": 1.0794, "step": 27695 }, { "epoch": 0.83, "learning_rate": 3.5127666143273094e-07, "loss": 1.1234, "step": 27696 }, { "epoch": 0.83, "learning_rate": 3.511519910305861e-07, "loss": 1.1511, "step": 27697 }, { "epoch": 0.83, "learning_rate": 3.510273410844392e-07, "loss": 1.1923, "step": 27698 }, { "epoch": 0.83, "learning_rate": 3.5090271159547717e-07, "loss": 1.1744, "step": 27699 }, { "epoch": 0.83, "learning_rate": 3.507781025648868e-07, "loss": 1.1301, "step": 27700 }, { "epoch": 0.83, "learning_rate": 3.5065351399385326e-07, "loss": 1.1721, "step": 27701 }, { "epoch": 0.83, "learning_rate": 3.5052894588356314e-07, "loss": 1.1497, "step": 27702 }, { "epoch": 0.83, "learning_rate": 3.504043982352021e-07, "loss": 1.0233, "step": 27703 }, { "epoch": 0.83, "learning_rate": 3.502798710499561e-07, "loss": 1.04, "step": 27704 }, { "epoch": 0.83, "learning_rate": 3.501553643290104e-07, "loss": 1.1709, "step": 27705 }, { "epoch": 0.83, "learning_rate": 3.5003087807355007e-07, "loss": 1.1793, "step": 27706 }, { "epoch": 0.83, "learning_rate": 3.4990641228476035e-07, "loss": 1.0991, "step": 27707 }, { "epoch": 0.83, "learning_rate": 3.4978196696382665e-07, "loss": 0.9733, "step": 27708 }, { "epoch": 0.83, "learning_rate": 3.496575421119325e-07, "loss": 1.0484, "step": 27709 }, { "epoch": 0.83, "learning_rate": 3.49533137730263e-07, "loss": 1.1482, "step": 27710 }, { "epoch": 0.83, "learning_rate": 3.494087538200022e-07, "loss": 1.021, "step": 27711 }, { "epoch": 0.83, "learning_rate": 3.4928439038233427e-07, "loss": 1.2548, "step": 27712 }, { "epoch": 0.83, "learning_rate": 3.491600474184437e-07, "loss": 1.0128, "step": 27713 }, { "epoch": 0.83, "learning_rate": 3.4903572492951316e-07, "loss": 1.1584, "step": 27714 }, { "epoch": 0.83, "learning_rate": 3.489114229167265e-07, "loss": 1.0459, "step": 27715 }, { "epoch": 0.83, "learning_rate": 3.487871413812671e-07, "loss": 1.0554, "step": 27716 }, { "epoch": 0.83, "learning_rate": 3.486628803243186e-07, "loss": 1.0875, "step": 27717 }, { "epoch": 0.84, "learning_rate": 3.4853863974706274e-07, "loss": 1.246, "step": 27718 }, { "epoch": 0.84, "learning_rate": 3.4841441965068306e-07, "loss": 1.1842, "step": 27719 }, { "epoch": 0.84, "learning_rate": 3.4829022003636165e-07, "loss": 1.174, "step": 27720 }, { "epoch": 0.84, "learning_rate": 3.481660409052812e-07, "loss": 1.0848, "step": 27721 }, { "epoch": 0.84, "learning_rate": 3.48041882258624e-07, "loss": 0.975, "step": 27722 }, { "epoch": 0.84, "learning_rate": 3.4791774409757145e-07, "loss": 1.0842, "step": 27723 }, { "epoch": 0.84, "learning_rate": 3.4779362642330534e-07, "loss": 1.241, "step": 27724 }, { "epoch": 0.84, "learning_rate": 3.476695292370072e-07, "loss": 1.1599, "step": 27725 }, { "epoch": 0.84, "learning_rate": 3.4754545253985944e-07, "loss": 1.0612, "step": 27726 }, { "epoch": 0.84, "learning_rate": 3.474213963330414e-07, "loss": 0.9987, "step": 27727 }, { "epoch": 0.84, "learning_rate": 3.4729736061773514e-07, "loss": 1.0041, "step": 27728 }, { "epoch": 0.84, "learning_rate": 3.471733453951212e-07, "loss": 1.1842, "step": 27729 }, { "epoch": 0.84, "learning_rate": 3.470493506663808e-07, "loss": 1.1536, "step": 27730 }, { "epoch": 0.84, "learning_rate": 3.4692537643269297e-07, "loss": 1.2058, "step": 27731 }, { "epoch": 0.84, "learning_rate": 3.4680142269523875e-07, "loss": 0.9529, "step": 27732 }, { "epoch": 0.84, "learning_rate": 3.46677489455198e-07, "loss": 1.1302, "step": 27733 }, { "epoch": 0.84, "learning_rate": 3.465535767137504e-07, "loss": 1.0698, "step": 27734 }, { "epoch": 0.84, "learning_rate": 3.464296844720755e-07, "loss": 1.1058, "step": 27735 }, { "epoch": 0.84, "learning_rate": 3.463058127313529e-07, "loss": 1.1447, "step": 27736 }, { "epoch": 0.84, "learning_rate": 3.461819614927617e-07, "loss": 1.157, "step": 27737 }, { "epoch": 0.84, "learning_rate": 3.4605813075748093e-07, "loss": 1.0743, "step": 27738 }, { "epoch": 0.84, "learning_rate": 3.459343205266899e-07, "loss": 1.0846, "step": 27739 }, { "epoch": 0.84, "learning_rate": 3.4581053080156635e-07, "loss": 0.9811, "step": 27740 }, { "epoch": 0.84, "learning_rate": 3.456867615832887e-07, "loss": 1.075, "step": 27741 }, { "epoch": 0.84, "learning_rate": 3.4556301287303585e-07, "loss": 1.0593, "step": 27742 }, { "epoch": 0.84, "learning_rate": 3.454392846719859e-07, "loss": 1.1198, "step": 27743 }, { "epoch": 0.84, "learning_rate": 3.4531557698131574e-07, "loss": 1.11, "step": 27744 }, { "epoch": 0.84, "learning_rate": 3.451918898022036e-07, "loss": 1.057, "step": 27745 }, { "epoch": 0.84, "learning_rate": 3.4506822313582683e-07, "loss": 0.9813, "step": 27746 }, { "epoch": 0.84, "learning_rate": 3.4494457698336284e-07, "loss": 1.1547, "step": 27747 }, { "epoch": 0.84, "learning_rate": 3.448209513459891e-07, "loss": 1.181, "step": 27748 }, { "epoch": 0.84, "learning_rate": 3.4469734622488123e-07, "loss": 1.1035, "step": 27749 }, { "epoch": 0.84, "learning_rate": 3.445737616212166e-07, "loss": 1.1123, "step": 27750 }, { "epoch": 0.84, "learning_rate": 3.444501975361719e-07, "loss": 1.0784, "step": 27751 }, { "epoch": 0.84, "learning_rate": 3.4432665397092337e-07, "loss": 0.9749, "step": 27752 }, { "epoch": 0.84, "learning_rate": 3.4420313092664663e-07, "loss": 1.0455, "step": 27753 }, { "epoch": 0.84, "learning_rate": 3.440796284045178e-07, "loss": 1.1337, "step": 27754 }, { "epoch": 0.84, "learning_rate": 3.4395614640571254e-07, "loss": 1.1089, "step": 27755 }, { "epoch": 0.84, "learning_rate": 3.4383268493140693e-07, "loss": 1.1356, "step": 27756 }, { "epoch": 0.84, "learning_rate": 3.4370924398277496e-07, "loss": 1.0447, "step": 27757 }, { "epoch": 0.84, "learning_rate": 3.4358582356099263e-07, "loss": 1.1302, "step": 27758 }, { "epoch": 0.84, "learning_rate": 3.434624236672349e-07, "loss": 1.1585, "step": 27759 }, { "epoch": 0.84, "learning_rate": 3.4333904430267603e-07, "loss": 0.9686, "step": 27760 }, { "epoch": 0.84, "learning_rate": 3.4321568546849063e-07, "loss": 1.184, "step": 27761 }, { "epoch": 0.84, "learning_rate": 3.430923471658534e-07, "loss": 1.0906, "step": 27762 }, { "epoch": 0.84, "learning_rate": 3.429690293959381e-07, "loss": 1.06, "step": 27763 }, { "epoch": 0.84, "learning_rate": 3.428457321599191e-07, "loss": 1.1834, "step": 27764 }, { "epoch": 0.84, "learning_rate": 3.4272245545897004e-07, "loss": 1.0263, "step": 27765 }, { "epoch": 0.84, "learning_rate": 3.425991992942637e-07, "loss": 1.0282, "step": 27766 }, { "epoch": 0.84, "learning_rate": 3.424759636669742e-07, "loss": 1.1958, "step": 27767 }, { "epoch": 0.84, "learning_rate": 3.4235274857827406e-07, "loss": 1.1205, "step": 27768 }, { "epoch": 0.84, "learning_rate": 3.4222955402933745e-07, "loss": 1.1821, "step": 27769 }, { "epoch": 0.84, "learning_rate": 3.421063800213353e-07, "loss": 1.0934, "step": 27770 }, { "epoch": 0.84, "learning_rate": 3.4198322655544154e-07, "loss": 1.1522, "step": 27771 }, { "epoch": 0.84, "learning_rate": 3.4186009363282815e-07, "loss": 1.0111, "step": 27772 }, { "epoch": 0.84, "learning_rate": 3.4173698125466754e-07, "loss": 1.1982, "step": 27773 }, { "epoch": 0.84, "learning_rate": 3.41613889422131e-07, "loss": 1.2665, "step": 27774 }, { "epoch": 0.84, "learning_rate": 3.4149081813639075e-07, "loss": 1.0811, "step": 27775 }, { "epoch": 0.84, "learning_rate": 3.413677673986182e-07, "loss": 1.0826, "step": 27776 }, { "epoch": 0.84, "learning_rate": 3.41244737209985e-07, "loss": 1.1696, "step": 27777 }, { "epoch": 0.84, "learning_rate": 3.4112172757166274e-07, "loss": 1.2258, "step": 27778 }, { "epoch": 0.84, "learning_rate": 3.4099873848482125e-07, "loss": 1.2277, "step": 27779 }, { "epoch": 0.84, "learning_rate": 3.408757699506321e-07, "loss": 1.1533, "step": 27780 }, { "epoch": 0.84, "learning_rate": 3.4075282197026575e-07, "loss": 1.189, "step": 27781 }, { "epoch": 0.84, "learning_rate": 3.40629894544893e-07, "loss": 1.1239, "step": 27782 }, { "epoch": 0.84, "learning_rate": 3.4050698767568337e-07, "loss": 1.1805, "step": 27783 }, { "epoch": 0.84, "learning_rate": 3.403841013638068e-07, "loss": 1.0838, "step": 27784 }, { "epoch": 0.84, "learning_rate": 3.402612356104337e-07, "loss": 1.1426, "step": 27785 }, { "epoch": 0.84, "learning_rate": 3.401383904167335e-07, "loss": 1.089, "step": 27786 }, { "epoch": 0.84, "learning_rate": 3.400155657838755e-07, "loss": 1.0806, "step": 27787 }, { "epoch": 0.84, "learning_rate": 3.39892761713029e-07, "loss": 0.9907, "step": 27788 }, { "epoch": 0.84, "learning_rate": 3.397699782053632e-07, "loss": 1.1749, "step": 27789 }, { "epoch": 0.84, "learning_rate": 3.396472152620467e-07, "loss": 1.0522, "step": 27790 }, { "epoch": 0.84, "learning_rate": 3.3952447288424896e-07, "loss": 1.2151, "step": 27791 }, { "epoch": 0.84, "learning_rate": 3.3940175107313704e-07, "loss": 1.1173, "step": 27792 }, { "epoch": 0.84, "learning_rate": 3.392790498298798e-07, "loss": 1.074, "step": 27793 }, { "epoch": 0.84, "learning_rate": 3.3915636915564573e-07, "loss": 1.1384, "step": 27794 }, { "epoch": 0.84, "learning_rate": 3.3903370905160246e-07, "loss": 1.072, "step": 27795 }, { "epoch": 0.84, "learning_rate": 3.3891106951891713e-07, "loss": 1.1412, "step": 27796 }, { "epoch": 0.84, "learning_rate": 3.387884505587577e-07, "loss": 1.0065, "step": 27797 }, { "epoch": 0.84, "learning_rate": 3.3866585217229104e-07, "loss": 1.0108, "step": 27798 }, { "epoch": 0.84, "learning_rate": 3.3854327436068535e-07, "loss": 1.0399, "step": 27799 }, { "epoch": 0.84, "learning_rate": 3.384207171251061e-07, "loss": 1.1353, "step": 27800 }, { "epoch": 0.84, "learning_rate": 3.382981804667204e-07, "loss": 1.1016, "step": 27801 }, { "epoch": 0.84, "learning_rate": 3.3817566438669513e-07, "loss": 1.0093, "step": 27802 }, { "epoch": 0.84, "learning_rate": 3.3805316888619625e-07, "loss": 1.0211, "step": 27803 }, { "epoch": 0.84, "learning_rate": 3.3793069396639067e-07, "loss": 1.1308, "step": 27804 }, { "epoch": 0.84, "learning_rate": 3.3780823962844296e-07, "loss": 1.0653, "step": 27805 }, { "epoch": 0.84, "learning_rate": 3.376858058735194e-07, "loss": 1.0998, "step": 27806 }, { "epoch": 0.84, "learning_rate": 3.375633927027855e-07, "loss": 1.0699, "step": 27807 }, { "epoch": 0.84, "learning_rate": 3.374410001174072e-07, "loss": 1.0677, "step": 27808 }, { "epoch": 0.84, "learning_rate": 3.3731862811854867e-07, "loss": 1.0175, "step": 27809 }, { "epoch": 0.84, "learning_rate": 3.3719627670737523e-07, "loss": 1.1518, "step": 27810 }, { "epoch": 0.84, "learning_rate": 3.370739458850514e-07, "loss": 1.0659, "step": 27811 }, { "epoch": 0.84, "learning_rate": 3.369516356527419e-07, "loss": 1.083, "step": 27812 }, { "epoch": 0.84, "learning_rate": 3.3682934601161175e-07, "loss": 1.0094, "step": 27813 }, { "epoch": 0.84, "learning_rate": 3.367070769628239e-07, "loss": 1.2205, "step": 27814 }, { "epoch": 0.84, "learning_rate": 3.365848285075427e-07, "loss": 1.0499, "step": 27815 }, { "epoch": 0.84, "learning_rate": 3.364626006469321e-07, "loss": 0.9858, "step": 27816 }, { "epoch": 0.84, "learning_rate": 3.363403933821555e-07, "loss": 1.1303, "step": 27817 }, { "epoch": 0.84, "learning_rate": 3.362182067143763e-07, "loss": 1.0743, "step": 27818 }, { "epoch": 0.84, "learning_rate": 3.360960406447575e-07, "loss": 1.0211, "step": 27819 }, { "epoch": 0.84, "learning_rate": 3.359738951744623e-07, "loss": 1.1185, "step": 27820 }, { "epoch": 0.84, "learning_rate": 3.3585177030465403e-07, "loss": 1.0624, "step": 27821 }, { "epoch": 0.84, "learning_rate": 3.357296660364942e-07, "loss": 1.1002, "step": 27822 }, { "epoch": 0.84, "learning_rate": 3.356075823711452e-07, "loss": 1.1184, "step": 27823 }, { "epoch": 0.84, "learning_rate": 3.3548551930977e-07, "loss": 1.2523, "step": 27824 }, { "epoch": 0.84, "learning_rate": 3.353634768535305e-07, "loss": 1.0523, "step": 27825 }, { "epoch": 0.84, "learning_rate": 3.352414550035876e-07, "loss": 1.0657, "step": 27826 }, { "epoch": 0.84, "learning_rate": 3.351194537611038e-07, "loss": 0.9739, "step": 27827 }, { "epoch": 0.84, "learning_rate": 3.349974731272398e-07, "loss": 1.1296, "step": 27828 }, { "epoch": 0.84, "learning_rate": 3.3487551310315725e-07, "loss": 1.0595, "step": 27829 }, { "epoch": 0.84, "learning_rate": 3.347535736900176e-07, "loss": 1.0803, "step": 27830 }, { "epoch": 0.84, "learning_rate": 3.346316548889808e-07, "loss": 1.024, "step": 27831 }, { "epoch": 0.84, "learning_rate": 3.345097567012076e-07, "loss": 1.0786, "step": 27832 }, { "epoch": 0.84, "learning_rate": 3.3438787912785846e-07, "loss": 1.0499, "step": 27833 }, { "epoch": 0.84, "learning_rate": 3.342660221700944e-07, "loss": 1.0018, "step": 27834 }, { "epoch": 0.84, "learning_rate": 3.3414418582907393e-07, "loss": 1.1658, "step": 27835 }, { "epoch": 0.84, "learning_rate": 3.3402237010595804e-07, "loss": 0.9757, "step": 27836 }, { "epoch": 0.84, "learning_rate": 3.339005750019059e-07, "loss": 1.0463, "step": 27837 }, { "epoch": 0.84, "learning_rate": 3.3377880051807754e-07, "loss": 1.0521, "step": 27838 }, { "epoch": 0.84, "learning_rate": 3.336570466556313e-07, "loss": 1.0168, "step": 27839 }, { "epoch": 0.84, "learning_rate": 3.335353134157265e-07, "loss": 1.0563, "step": 27840 }, { "epoch": 0.84, "learning_rate": 3.334136007995223e-07, "loss": 1.1352, "step": 27841 }, { "epoch": 0.84, "learning_rate": 3.332919088081771e-07, "loss": 1.1008, "step": 27842 }, { "epoch": 0.84, "learning_rate": 3.331702374428492e-07, "loss": 1.2423, "step": 27843 }, { "epoch": 0.84, "learning_rate": 3.330485867046973e-07, "loss": 1.0189, "step": 27844 }, { "epoch": 0.84, "learning_rate": 3.3292695659487894e-07, "loss": 1.0581, "step": 27845 }, { "epoch": 0.84, "learning_rate": 3.328053471145526e-07, "loss": 1.1301, "step": 27846 }, { "epoch": 0.84, "learning_rate": 3.326837582648759e-07, "loss": 0.9937, "step": 27847 }, { "epoch": 0.84, "learning_rate": 3.325621900470055e-07, "loss": 1.2081, "step": 27848 }, { "epoch": 0.84, "learning_rate": 3.3244064246209907e-07, "loss": 1.1569, "step": 27849 }, { "epoch": 0.84, "learning_rate": 3.3231911551131395e-07, "loss": 1.0775, "step": 27850 }, { "epoch": 0.84, "learning_rate": 3.3219760919580737e-07, "loss": 1.0235, "step": 27851 }, { "epoch": 0.84, "learning_rate": 3.3207612351673495e-07, "loss": 1.1177, "step": 27852 }, { "epoch": 0.84, "learning_rate": 3.3195465847525395e-07, "loss": 1.1844, "step": 27853 }, { "epoch": 0.84, "learning_rate": 3.3183321407252e-07, "loss": 1.0485, "step": 27854 }, { "epoch": 0.84, "learning_rate": 3.3171179030969005e-07, "loss": 1.199, "step": 27855 }, { "epoch": 0.84, "learning_rate": 3.3159038718791976e-07, "loss": 1.0787, "step": 27856 }, { "epoch": 0.84, "learning_rate": 3.3146900470836437e-07, "loss": 1.0734, "step": 27857 }, { "epoch": 0.84, "learning_rate": 3.313476428721796e-07, "loss": 1.148, "step": 27858 }, { "epoch": 0.84, "learning_rate": 3.3122630168052063e-07, "loss": 0.986, "step": 27859 }, { "epoch": 0.84, "learning_rate": 3.3110498113454346e-07, "loss": 1.1003, "step": 27860 }, { "epoch": 0.84, "learning_rate": 3.309836812354017e-07, "loss": 1.0901, "step": 27861 }, { "epoch": 0.84, "learning_rate": 3.308624019842507e-07, "loss": 1.1388, "step": 27862 }, { "epoch": 0.84, "learning_rate": 3.307411433822449e-07, "loss": 1.1013, "step": 27863 }, { "epoch": 0.84, "learning_rate": 3.3061990543053923e-07, "loss": 1.0138, "step": 27864 }, { "epoch": 0.84, "learning_rate": 3.304986881302866e-07, "loss": 1.0796, "step": 27865 }, { "epoch": 0.84, "learning_rate": 3.303774914826419e-07, "loss": 1.0906, "step": 27866 }, { "epoch": 0.84, "learning_rate": 3.302563154887581e-07, "loss": 1.0986, "step": 27867 }, { "epoch": 0.84, "learning_rate": 3.3013516014978955e-07, "loss": 1.1227, "step": 27868 }, { "epoch": 0.84, "learning_rate": 3.30014025466889e-07, "loss": 1.2007, "step": 27869 }, { "epoch": 0.84, "learning_rate": 3.2989291144121e-07, "loss": 1.0938, "step": 27870 }, { "epoch": 0.84, "learning_rate": 3.297718180739054e-07, "loss": 1.0159, "step": 27871 }, { "epoch": 0.84, "learning_rate": 3.2965074536612766e-07, "loss": 1.1542, "step": 27872 }, { "epoch": 0.84, "learning_rate": 3.2952969331903005e-07, "loss": 0.9967, "step": 27873 }, { "epoch": 0.84, "learning_rate": 3.2940866193376414e-07, "loss": 1.1578, "step": 27874 }, { "epoch": 0.84, "learning_rate": 3.292876512114823e-07, "loss": 1.1638, "step": 27875 }, { "epoch": 0.84, "learning_rate": 3.2916666115333646e-07, "loss": 1.1032, "step": 27876 }, { "epoch": 0.84, "learning_rate": 3.29045691760479e-07, "loss": 1.028, "step": 27877 }, { "epoch": 0.84, "learning_rate": 3.289247430340606e-07, "loss": 0.9977, "step": 27878 }, { "epoch": 0.84, "learning_rate": 3.288038149752329e-07, "loss": 1.118, "step": 27879 }, { "epoch": 0.84, "learning_rate": 3.286829075851472e-07, "loss": 1.0949, "step": 27880 }, { "epoch": 0.84, "learning_rate": 3.285620208649545e-07, "loss": 1.0939, "step": 27881 }, { "epoch": 0.84, "learning_rate": 3.284411548158062e-07, "loss": 1.0103, "step": 27882 }, { "epoch": 0.84, "learning_rate": 3.2832030943885177e-07, "loss": 1.1193, "step": 27883 }, { "epoch": 0.84, "learning_rate": 3.281994847352418e-07, "loss": 1.0767, "step": 27884 }, { "epoch": 0.84, "learning_rate": 3.2807868070612704e-07, "loss": 1.0308, "step": 27885 }, { "epoch": 0.84, "learning_rate": 3.279578973526576e-07, "loss": 1.1294, "step": 27886 }, { "epoch": 0.84, "learning_rate": 3.278371346759823e-07, "loss": 1.1571, "step": 27887 }, { "epoch": 0.84, "learning_rate": 3.277163926772514e-07, "loss": 1.0747, "step": 27888 }, { "epoch": 0.84, "learning_rate": 3.275956713576142e-07, "loss": 1.1056, "step": 27889 }, { "epoch": 0.84, "learning_rate": 3.274749707182204e-07, "loss": 1.1757, "step": 27890 }, { "epoch": 0.84, "learning_rate": 3.2735429076021813e-07, "loss": 1.1392, "step": 27891 }, { "epoch": 0.84, "learning_rate": 3.272336314847566e-07, "loss": 1.0668, "step": 27892 }, { "epoch": 0.84, "learning_rate": 3.271129928929845e-07, "loss": 1.1082, "step": 27893 }, { "epoch": 0.84, "learning_rate": 3.2699237498605014e-07, "loss": 1.0096, "step": 27894 }, { "epoch": 0.84, "learning_rate": 3.268717777651026e-07, "loss": 1.1647, "step": 27895 }, { "epoch": 0.84, "learning_rate": 3.2675120123128817e-07, "loss": 1.0109, "step": 27896 }, { "epoch": 0.84, "learning_rate": 3.26630645385756e-07, "loss": 1.0129, "step": 27897 }, { "epoch": 0.84, "learning_rate": 3.265101102296531e-07, "loss": 1.0847, "step": 27898 }, { "epoch": 0.84, "learning_rate": 3.2638959576412723e-07, "loss": 1.1334, "step": 27899 }, { "epoch": 0.84, "learning_rate": 3.262691019903255e-07, "loss": 1.0257, "step": 27900 }, { "epoch": 0.84, "learning_rate": 3.2614862890939516e-07, "loss": 1.0452, "step": 27901 }, { "epoch": 0.84, "learning_rate": 3.260281765224829e-07, "loss": 1.0524, "step": 27902 }, { "epoch": 0.84, "learning_rate": 3.25907744830736e-07, "loss": 1.0766, "step": 27903 }, { "epoch": 0.84, "learning_rate": 3.257873338352996e-07, "loss": 1.1868, "step": 27904 }, { "epoch": 0.84, "learning_rate": 3.2566694353732054e-07, "loss": 1.1581, "step": 27905 }, { "epoch": 0.84, "learning_rate": 3.2554657393794516e-07, "loss": 1.0547, "step": 27906 }, { "epoch": 0.84, "learning_rate": 3.254262250383192e-07, "loss": 1.0855, "step": 27907 }, { "epoch": 0.84, "learning_rate": 3.253058968395886e-07, "loss": 1.0632, "step": 27908 }, { "epoch": 0.84, "learning_rate": 3.2518558934289816e-07, "loss": 0.9814, "step": 27909 }, { "epoch": 0.84, "learning_rate": 3.250653025493933e-07, "loss": 1.0945, "step": 27910 }, { "epoch": 0.84, "learning_rate": 3.249450364602194e-07, "loss": 1.2513, "step": 27911 }, { "epoch": 0.84, "learning_rate": 3.248247910765218e-07, "loss": 1.1272, "step": 27912 }, { "epoch": 0.84, "learning_rate": 3.247045663994439e-07, "loss": 1.063, "step": 27913 }, { "epoch": 0.84, "learning_rate": 3.245843624301309e-07, "loss": 1.053, "step": 27914 }, { "epoch": 0.84, "learning_rate": 3.24464179169727e-07, "loss": 1.1428, "step": 27915 }, { "epoch": 0.84, "learning_rate": 3.2434401661937703e-07, "loss": 1.0334, "step": 27916 }, { "epoch": 0.84, "learning_rate": 3.2422387478022343e-07, "loss": 1.1378, "step": 27917 }, { "epoch": 0.84, "learning_rate": 3.2410375365341086e-07, "loss": 1.1412, "step": 27918 }, { "epoch": 0.84, "learning_rate": 3.239836532400825e-07, "loss": 1.0353, "step": 27919 }, { "epoch": 0.84, "learning_rate": 3.23863573541382e-07, "loss": 1.158, "step": 27920 }, { "epoch": 0.84, "learning_rate": 3.237435145584525e-07, "loss": 1.1462, "step": 27921 }, { "epoch": 0.84, "learning_rate": 3.2362347629243616e-07, "loss": 1.1285, "step": 27922 }, { "epoch": 0.84, "learning_rate": 3.2350345874447605e-07, "loss": 0.9736, "step": 27923 }, { "epoch": 0.84, "learning_rate": 3.2338346191571476e-07, "loss": 1.2018, "step": 27924 }, { "epoch": 0.84, "learning_rate": 3.232634858072947e-07, "loss": 1.1505, "step": 27925 }, { "epoch": 0.84, "learning_rate": 3.231435304203581e-07, "loss": 1.1451, "step": 27926 }, { "epoch": 0.84, "learning_rate": 3.2302359575604626e-07, "loss": 1.0567, "step": 27927 }, { "epoch": 0.84, "learning_rate": 3.229036818155018e-07, "loss": 1.2516, "step": 27928 }, { "epoch": 0.84, "learning_rate": 3.2278378859986583e-07, "loss": 1.1739, "step": 27929 }, { "epoch": 0.84, "learning_rate": 3.226639161102793e-07, "loss": 1.1461, "step": 27930 }, { "epoch": 0.84, "learning_rate": 3.225440643478836e-07, "loss": 1.16, "step": 27931 }, { "epoch": 0.84, "learning_rate": 3.2242423331382e-07, "loss": 1.0499, "step": 27932 }, { "epoch": 0.84, "learning_rate": 3.223044230092287e-07, "loss": 1.0629, "step": 27933 }, { "epoch": 0.84, "learning_rate": 3.22184633435251e-07, "loss": 1.0526, "step": 27934 }, { "epoch": 0.84, "learning_rate": 3.2206486459302606e-07, "loss": 1.1321, "step": 27935 }, { "epoch": 0.84, "learning_rate": 3.219451164836948e-07, "loss": 1.0377, "step": 27936 }, { "epoch": 0.84, "learning_rate": 3.218253891083972e-07, "loss": 1.145, "step": 27937 }, { "epoch": 0.84, "learning_rate": 3.217056824682732e-07, "loss": 1.0885, "step": 27938 }, { "epoch": 0.84, "learning_rate": 3.215859965644613e-07, "loss": 1.1053, "step": 27939 }, { "epoch": 0.84, "learning_rate": 3.21466331398102e-07, "loss": 1.0855, "step": 27940 }, { "epoch": 0.84, "learning_rate": 3.2134668697033357e-07, "loss": 1.1257, "step": 27941 }, { "epoch": 0.84, "learning_rate": 3.2122706328229613e-07, "loss": 1.0328, "step": 27942 }, { "epoch": 0.84, "learning_rate": 3.211074603351272e-07, "loss": 1.0823, "step": 27943 }, { "epoch": 0.84, "learning_rate": 3.209878781299661e-07, "loss": 1.0764, "step": 27944 }, { "epoch": 0.84, "learning_rate": 3.208683166679505e-07, "loss": 1.0526, "step": 27945 }, { "epoch": 0.84, "learning_rate": 3.2074877595021926e-07, "loss": 1.026, "step": 27946 }, { "epoch": 0.84, "learning_rate": 3.2062925597791063e-07, "loss": 1.2189, "step": 27947 }, { "epoch": 0.84, "learning_rate": 3.205097567521612e-07, "loss": 1.045, "step": 27948 }, { "epoch": 0.84, "learning_rate": 3.2039027827410947e-07, "loss": 1.0847, "step": 27949 }, { "epoch": 0.84, "learning_rate": 3.2027082054489233e-07, "loss": 1.1205, "step": 27950 }, { "epoch": 0.84, "learning_rate": 3.2015138356564723e-07, "loss": 1.0579, "step": 27951 }, { "epoch": 0.84, "learning_rate": 3.20031967337511e-07, "loss": 1.0905, "step": 27952 }, { "epoch": 0.84, "learning_rate": 3.1991257186162083e-07, "loss": 1.0328, "step": 27953 }, { "epoch": 0.84, "learning_rate": 3.197931971391127e-07, "loss": 1.1481, "step": 27954 }, { "epoch": 0.84, "learning_rate": 3.196738431711241e-07, "loss": 1.0691, "step": 27955 }, { "epoch": 0.84, "learning_rate": 3.195545099587896e-07, "loss": 1.1142, "step": 27956 }, { "epoch": 0.84, "learning_rate": 3.1943519750324615e-07, "loss": 1.1149, "step": 27957 }, { "epoch": 0.84, "learning_rate": 3.193159058056297e-07, "loss": 1.2041, "step": 27958 }, { "epoch": 0.84, "learning_rate": 3.1919663486707583e-07, "loss": 1.0966, "step": 27959 }, { "epoch": 0.84, "learning_rate": 3.1907738468871906e-07, "loss": 1.1276, "step": 27960 }, { "epoch": 0.84, "learning_rate": 3.1895815527169553e-07, "loss": 1.0773, "step": 27961 }, { "epoch": 0.84, "learning_rate": 3.188389466171396e-07, "loss": 1.2846, "step": 27962 }, { "epoch": 0.84, "learning_rate": 3.187197587261867e-07, "loss": 1.0845, "step": 27963 }, { "epoch": 0.84, "learning_rate": 3.186005915999715e-07, "loss": 1.1092, "step": 27964 }, { "epoch": 0.84, "learning_rate": 3.184814452396276e-07, "loss": 1.1783, "step": 27965 }, { "epoch": 0.84, "learning_rate": 3.1836231964628984e-07, "loss": 1.1275, "step": 27966 }, { "epoch": 0.84, "learning_rate": 3.1824321482109175e-07, "loss": 1.0885, "step": 27967 }, { "epoch": 0.84, "learning_rate": 3.1812413076516837e-07, "loss": 1.0565, "step": 27968 }, { "epoch": 0.84, "learning_rate": 3.180050674796517e-07, "loss": 1.0718, "step": 27969 }, { "epoch": 0.84, "learning_rate": 3.178860249656759e-07, "loss": 1.1122, "step": 27970 }, { "epoch": 0.84, "learning_rate": 3.177670032243743e-07, "loss": 1.0318, "step": 27971 }, { "epoch": 0.84, "learning_rate": 3.1764800225688036e-07, "loss": 1.1411, "step": 27972 }, { "epoch": 0.84, "learning_rate": 3.1752902206432565e-07, "loss": 1.1377, "step": 27973 }, { "epoch": 0.84, "learning_rate": 3.174100626478438e-07, "loss": 1.1377, "step": 27974 }, { "epoch": 0.84, "learning_rate": 3.172911240085669e-07, "loss": 1.1857, "step": 27975 }, { "epoch": 0.84, "learning_rate": 3.171722061476271e-07, "loss": 1.0386, "step": 27976 }, { "epoch": 0.84, "learning_rate": 3.1705330906615733e-07, "loss": 1.1161, "step": 27977 }, { "epoch": 0.84, "learning_rate": 3.169344327652882e-07, "loss": 1.0695, "step": 27978 }, { "epoch": 0.84, "learning_rate": 3.1681557724615174e-07, "loss": 1.1572, "step": 27979 }, { "epoch": 0.84, "learning_rate": 3.1669674250987965e-07, "loss": 1.1265, "step": 27980 }, { "epoch": 0.84, "learning_rate": 3.165779285576029e-07, "loss": 0.9874, "step": 27981 }, { "epoch": 0.84, "learning_rate": 3.164591353904528e-07, "loss": 1.0591, "step": 27982 }, { "epoch": 0.84, "learning_rate": 3.163403630095602e-07, "loss": 1.1415, "step": 27983 }, { "epoch": 0.84, "learning_rate": 3.1622161141605547e-07, "loss": 1.0549, "step": 27984 }, { "epoch": 0.84, "learning_rate": 3.1610288061107e-07, "loss": 1.1494, "step": 27985 }, { "epoch": 0.84, "learning_rate": 3.1598417059573255e-07, "loss": 1.1346, "step": 27986 }, { "epoch": 0.84, "learning_rate": 3.1586548137117397e-07, "loss": 1.1801, "step": 27987 }, { "epoch": 0.84, "learning_rate": 3.157468129385241e-07, "loss": 1.0693, "step": 27988 }, { "epoch": 0.84, "learning_rate": 3.156281652989127e-07, "loss": 1.0728, "step": 27989 }, { "epoch": 0.84, "learning_rate": 3.1550953845346953e-07, "loss": 1.1296, "step": 27990 }, { "epoch": 0.84, "learning_rate": 3.15390932403323e-07, "loss": 1.0467, "step": 27991 }, { "epoch": 0.84, "learning_rate": 3.1527234714960273e-07, "loss": 1.062, "step": 27992 }, { "epoch": 0.84, "learning_rate": 3.1515378269343757e-07, "loss": 1.1355, "step": 27993 }, { "epoch": 0.84, "learning_rate": 3.1503523903595653e-07, "loss": 1.1642, "step": 27994 }, { "epoch": 0.84, "learning_rate": 3.149167161782873e-07, "loss": 1.0737, "step": 27995 }, { "epoch": 0.84, "learning_rate": 3.147982141215583e-07, "loss": 1.11, "step": 27996 }, { "epoch": 0.84, "learning_rate": 3.14679732866898e-07, "loss": 1.0153, "step": 27997 }, { "epoch": 0.84, "learning_rate": 3.145612724154348e-07, "loss": 1.0585, "step": 27998 }, { "epoch": 0.84, "learning_rate": 3.1444283276829526e-07, "loss": 1.1321, "step": 27999 }, { "epoch": 0.84, "learning_rate": 3.143244139266072e-07, "loss": 1.1143, "step": 28000 }, { "epoch": 0.84, "learning_rate": 3.1420601589149805e-07, "loss": 1.1266, "step": 28001 }, { "epoch": 0.84, "learning_rate": 3.1408763866409483e-07, "loss": 1.2385, "step": 28002 }, { "epoch": 0.84, "learning_rate": 3.1396928224552535e-07, "loss": 1.0533, "step": 28003 }, { "epoch": 0.84, "learning_rate": 3.138509466369147e-07, "loss": 1.0089, "step": 28004 }, { "epoch": 0.84, "learning_rate": 3.137326318393902e-07, "loss": 1.1998, "step": 28005 }, { "epoch": 0.84, "learning_rate": 3.1361433785407817e-07, "loss": 1.2055, "step": 28006 }, { "epoch": 0.84, "learning_rate": 3.1349606468210447e-07, "loss": 1.098, "step": 28007 }, { "epoch": 0.84, "learning_rate": 3.1337781232459533e-07, "loss": 0.9962, "step": 28008 }, { "epoch": 0.84, "learning_rate": 3.1325958078267634e-07, "loss": 1.0497, "step": 28009 }, { "epoch": 0.84, "learning_rate": 3.131413700574729e-07, "loss": 1.0627, "step": 28010 }, { "epoch": 0.84, "learning_rate": 3.1302318015011073e-07, "loss": 1.1279, "step": 28011 }, { "epoch": 0.84, "learning_rate": 3.129050110617143e-07, "loss": 1.0939, "step": 28012 }, { "epoch": 0.84, "learning_rate": 3.1278686279340886e-07, "loss": 1.0846, "step": 28013 }, { "epoch": 0.84, "learning_rate": 3.1266873534631897e-07, "loss": 1.1572, "step": 28014 }, { "epoch": 0.84, "learning_rate": 3.1255062872156935e-07, "loss": 1.0245, "step": 28015 }, { "epoch": 0.84, "learning_rate": 3.1243254292028484e-07, "loss": 1.0068, "step": 28016 }, { "epoch": 0.84, "learning_rate": 3.1231447794358825e-07, "loss": 1.1128, "step": 28017 }, { "epoch": 0.84, "learning_rate": 3.1219643379260423e-07, "loss": 1.1712, "step": 28018 }, { "epoch": 0.84, "learning_rate": 3.120784104684565e-07, "loss": 1.1489, "step": 28019 }, { "epoch": 0.84, "learning_rate": 3.119604079722691e-07, "loss": 1.1462, "step": 28020 }, { "epoch": 0.84, "learning_rate": 3.118424263051642e-07, "loss": 1.2778, "step": 28021 }, { "epoch": 0.84, "learning_rate": 3.117244654682658e-07, "loss": 1.0411, "step": 28022 }, { "epoch": 0.84, "learning_rate": 3.1160652546269626e-07, "loss": 1.1298, "step": 28023 }, { "epoch": 0.84, "learning_rate": 3.1148860628957946e-07, "loss": 1.0364, "step": 28024 }, { "epoch": 0.84, "learning_rate": 3.113707079500364e-07, "loss": 1.2631, "step": 28025 }, { "epoch": 0.84, "learning_rate": 3.1125283044519007e-07, "loss": 1.1685, "step": 28026 }, { "epoch": 0.84, "learning_rate": 3.111349737761629e-07, "loss": 1.0352, "step": 28027 }, { "epoch": 0.84, "learning_rate": 3.110171379440763e-07, "loss": 1.0295, "step": 28028 }, { "epoch": 0.84, "learning_rate": 3.108993229500529e-07, "loss": 1.1377, "step": 28029 }, { "epoch": 0.84, "learning_rate": 3.107815287952132e-07, "loss": 1.0836, "step": 28030 }, { "epoch": 0.84, "learning_rate": 3.1066375548067904e-07, "loss": 1.2242, "step": 28031 }, { "epoch": 0.84, "learning_rate": 3.105460030075713e-07, "loss": 1.0745, "step": 28032 }, { "epoch": 0.84, "learning_rate": 3.104282713770113e-07, "loss": 1.1165, "step": 28033 }, { "epoch": 0.84, "learning_rate": 3.1031056059011965e-07, "loss": 1.0506, "step": 28034 }, { "epoch": 0.84, "learning_rate": 3.101928706480167e-07, "loss": 1.1257, "step": 28035 }, { "epoch": 0.84, "learning_rate": 3.1007520155182295e-07, "loss": 1.1542, "step": 28036 }, { "epoch": 0.84, "learning_rate": 3.099575533026594e-07, "loss": 1.0015, "step": 28037 }, { "epoch": 0.84, "learning_rate": 3.0983992590164436e-07, "loss": 1.2073, "step": 28038 }, { "epoch": 0.84, "learning_rate": 3.0972231934989856e-07, "loss": 1.1226, "step": 28039 }, { "epoch": 0.84, "learning_rate": 3.096047336485414e-07, "loss": 0.9817, "step": 28040 }, { "epoch": 0.84, "learning_rate": 3.0948716879869225e-07, "loss": 1.1327, "step": 28041 }, { "epoch": 0.84, "learning_rate": 3.0936962480147076e-07, "loss": 1.1753, "step": 28042 }, { "epoch": 0.84, "learning_rate": 3.09252101657995e-07, "loss": 1.1091, "step": 28043 }, { "epoch": 0.84, "learning_rate": 3.0913459936938394e-07, "loss": 1.1404, "step": 28044 }, { "epoch": 0.84, "learning_rate": 3.0901711793675626e-07, "loss": 1.0771, "step": 28045 }, { "epoch": 0.84, "learning_rate": 3.08899657361231e-07, "loss": 1.0786, "step": 28046 }, { "epoch": 0.84, "learning_rate": 3.0878221764392534e-07, "loss": 1.0963, "step": 28047 }, { "epoch": 0.84, "learning_rate": 3.086647987859576e-07, "loss": 1.0471, "step": 28048 }, { "epoch": 0.84, "learning_rate": 3.085474007884456e-07, "loss": 1.0833, "step": 28049 }, { "epoch": 0.85, "learning_rate": 3.0843002365250727e-07, "loss": 1.1519, "step": 28050 }, { "epoch": 0.85, "learning_rate": 3.083126673792594e-07, "loss": 1.148, "step": 28051 }, { "epoch": 0.85, "learning_rate": 3.0819533196981913e-07, "loss": 1.0729, "step": 28052 }, { "epoch": 0.85, "learning_rate": 3.080780174253037e-07, "loss": 1.0291, "step": 28053 }, { "epoch": 0.85, "learning_rate": 3.0796072374683016e-07, "loss": 1.0524, "step": 28054 }, { "epoch": 0.85, "learning_rate": 3.078434509355149e-07, "loss": 1.1837, "step": 28055 }, { "epoch": 0.85, "learning_rate": 3.07726198992474e-07, "loss": 1.0975, "step": 28056 }, { "epoch": 0.85, "learning_rate": 3.0760896791882375e-07, "loss": 1.1211, "step": 28057 }, { "epoch": 0.85, "learning_rate": 3.0749175771568024e-07, "loss": 1.1235, "step": 28058 }, { "epoch": 0.85, "learning_rate": 3.0737456838415976e-07, "loss": 1.1372, "step": 28059 }, { "epoch": 0.85, "learning_rate": 3.0725739992537693e-07, "loss": 1.0845, "step": 28060 }, { "epoch": 0.85, "learning_rate": 3.0714025234044737e-07, "loss": 1.0264, "step": 28061 }, { "epoch": 0.85, "learning_rate": 3.0702312563048676e-07, "loss": 1.1651, "step": 28062 }, { "epoch": 0.85, "learning_rate": 3.0690601979660976e-07, "loss": 1.0203, "step": 28063 }, { "epoch": 0.85, "learning_rate": 3.067889348399311e-07, "loss": 1.0773, "step": 28064 }, { "epoch": 0.85, "learning_rate": 3.0667187076156567e-07, "loss": 1.0975, "step": 28065 }, { "epoch": 0.85, "learning_rate": 3.0655482756262733e-07, "loss": 1.0532, "step": 28066 }, { "epoch": 0.85, "learning_rate": 3.06437805244231e-07, "loss": 1.1826, "step": 28067 }, { "epoch": 0.85, "learning_rate": 3.063208038074908e-07, "loss": 1.0073, "step": 28068 }, { "epoch": 0.85, "learning_rate": 3.062038232535194e-07, "loss": 1.0081, "step": 28069 }, { "epoch": 0.85, "learning_rate": 3.06086863583431e-07, "loss": 1.088, "step": 28070 }, { "epoch": 0.85, "learning_rate": 3.0596992479833916e-07, "loss": 1.191, "step": 28071 }, { "epoch": 0.85, "learning_rate": 3.058530068993573e-07, "loss": 0.9952, "step": 28072 }, { "epoch": 0.85, "learning_rate": 3.0573610988759773e-07, "loss": 1.1183, "step": 28073 }, { "epoch": 0.85, "learning_rate": 3.056192337641736e-07, "loss": 1.1865, "step": 28074 }, { "epoch": 0.85, "learning_rate": 3.055023785301975e-07, "loss": 1.1688, "step": 28075 }, { "epoch": 0.85, "learning_rate": 3.053855441867823e-07, "loss": 1.1147, "step": 28076 }, { "epoch": 0.85, "learning_rate": 3.052687307350391e-07, "loss": 0.9668, "step": 28077 }, { "epoch": 0.85, "learning_rate": 3.051519381760809e-07, "loss": 1.2476, "step": 28078 }, { "epoch": 0.85, "learning_rate": 3.0503516651101876e-07, "loss": 1.0544, "step": 28079 }, { "epoch": 0.85, "learning_rate": 3.0491841574096513e-07, "loss": 1.1953, "step": 28080 }, { "epoch": 0.85, "learning_rate": 3.0480168586703134e-07, "loss": 1.119, "step": 28081 }, { "epoch": 0.85, "learning_rate": 3.046849768903276e-07, "loss": 1.1643, "step": 28082 }, { "epoch": 0.85, "learning_rate": 3.045682888119658e-07, "loss": 1.0573, "step": 28083 }, { "epoch": 0.85, "learning_rate": 3.044516216330565e-07, "loss": 1.1902, "step": 28084 }, { "epoch": 0.85, "learning_rate": 3.0433497535471063e-07, "loss": 1.0936, "step": 28085 }, { "epoch": 0.85, "learning_rate": 3.04218349978038e-07, "loss": 1.1861, "step": 28086 }, { "epoch": 0.85, "learning_rate": 3.041017455041492e-07, "loss": 1.116, "step": 28087 }, { "epoch": 0.85, "learning_rate": 3.0398516193415413e-07, "loss": 1.0013, "step": 28088 }, { "epoch": 0.85, "learning_rate": 3.038685992691626e-07, "loss": 1.1285, "step": 28089 }, { "epoch": 0.85, "learning_rate": 3.037520575102845e-07, "loss": 1.0474, "step": 28090 }, { "epoch": 0.85, "learning_rate": 3.0363553665862883e-07, "loss": 1.0347, "step": 28091 }, { "epoch": 0.85, "learning_rate": 3.035190367153054e-07, "loss": 1.1811, "step": 28092 }, { "epoch": 0.85, "learning_rate": 3.034025576814226e-07, "loss": 1.1254, "step": 28093 }, { "epoch": 0.85, "learning_rate": 3.0328609955808994e-07, "loss": 1.1018, "step": 28094 }, { "epoch": 0.85, "learning_rate": 3.031696623464153e-07, "loss": 1.1348, "step": 28095 }, { "epoch": 0.85, "learning_rate": 3.0305324604750746e-07, "loss": 1.064, "step": 28096 }, { "epoch": 0.85, "learning_rate": 3.029368506624747e-07, "loss": 1.1095, "step": 28097 }, { "epoch": 0.85, "learning_rate": 3.028204761924253e-07, "loss": 1.1265, "step": 28098 }, { "epoch": 0.85, "learning_rate": 3.027041226384664e-07, "loss": 1.152, "step": 28099 }, { "epoch": 0.85, "learning_rate": 3.02587790001706e-07, "loss": 1.1545, "step": 28100 }, { "epoch": 0.85, "learning_rate": 3.0247147828325136e-07, "loss": 1.0806, "step": 28101 }, { "epoch": 0.85, "learning_rate": 3.0235518748421065e-07, "loss": 0.9888, "step": 28102 }, { "epoch": 0.85, "learning_rate": 3.0223891760568946e-07, "loss": 1.0217, "step": 28103 }, { "epoch": 0.85, "learning_rate": 3.0212266864879547e-07, "loss": 1.1685, "step": 28104 }, { "epoch": 0.85, "learning_rate": 3.0200644061463473e-07, "loss": 1.015, "step": 28105 }, { "epoch": 0.85, "learning_rate": 3.018902335043145e-07, "loss": 1.1129, "step": 28106 }, { "epoch": 0.85, "learning_rate": 3.0177404731894094e-07, "loss": 1.046, "step": 28107 }, { "epoch": 0.85, "learning_rate": 3.0165788205961916e-07, "loss": 1.1242, "step": 28108 }, { "epoch": 0.85, "learning_rate": 3.015417377274557e-07, "loss": 1.2508, "step": 28109 }, { "epoch": 0.85, "learning_rate": 3.014256143235561e-07, "loss": 1.1237, "step": 28110 }, { "epoch": 0.85, "learning_rate": 3.013095118490264e-07, "loss": 1.0407, "step": 28111 }, { "epoch": 0.85, "learning_rate": 3.0119343030497047e-07, "loss": 1.2417, "step": 28112 }, { "epoch": 0.85, "learning_rate": 3.010773696924943e-07, "loss": 0.9946, "step": 28113 }, { "epoch": 0.85, "learning_rate": 3.0096133001270234e-07, "loss": 1.1058, "step": 28114 }, { "epoch": 0.85, "learning_rate": 3.0084531126669953e-07, "loss": 1.0358, "step": 28115 }, { "epoch": 0.85, "learning_rate": 3.0072931345559024e-07, "loss": 1.0236, "step": 28116 }, { "epoch": 0.85, "learning_rate": 3.0061333658047863e-07, "loss": 1.0366, "step": 28117 }, { "epoch": 0.85, "learning_rate": 3.004973806424688e-07, "loss": 1.1317, "step": 28118 }, { "epoch": 0.85, "learning_rate": 3.003814456426646e-07, "loss": 1.1576, "step": 28119 }, { "epoch": 0.85, "learning_rate": 3.002655315821701e-07, "loss": 1.139, "step": 28120 }, { "epoch": 0.85, "learning_rate": 3.0014963846208777e-07, "loss": 1.0001, "step": 28121 }, { "epoch": 0.85, "learning_rate": 3.000337662835215e-07, "loss": 1.1055, "step": 28122 }, { "epoch": 0.85, "learning_rate": 2.9991791504757425e-07, "loss": 1.0667, "step": 28123 }, { "epoch": 0.85, "learning_rate": 2.9980208475534953e-07, "loss": 1.0682, "step": 28124 }, { "epoch": 0.85, "learning_rate": 2.9968627540794853e-07, "loss": 1.1515, "step": 28125 }, { "epoch": 0.85, "learning_rate": 2.9957048700647445e-07, "loss": 1.0497, "step": 28126 }, { "epoch": 0.85, "learning_rate": 2.9945471955202976e-07, "loss": 1.0543, "step": 28127 }, { "epoch": 0.85, "learning_rate": 2.993389730457169e-07, "loss": 1.1615, "step": 28128 }, { "epoch": 0.85, "learning_rate": 2.992232474886364e-07, "loss": 1.1188, "step": 28129 }, { "epoch": 0.85, "learning_rate": 2.991075428818907e-07, "loss": 0.9384, "step": 28130 }, { "epoch": 0.85, "learning_rate": 2.9899185922658113e-07, "loss": 1.104, "step": 28131 }, { "epoch": 0.85, "learning_rate": 2.9887619652380936e-07, "loss": 1.1022, "step": 28132 }, { "epoch": 0.85, "learning_rate": 2.987605547746764e-07, "loss": 1.0716, "step": 28133 }, { "epoch": 0.85, "learning_rate": 2.9864493398028217e-07, "loss": 1.1304, "step": 28134 }, { "epoch": 0.85, "learning_rate": 2.985293341417281e-07, "loss": 1.2184, "step": 28135 }, { "epoch": 0.85, "learning_rate": 2.9841375526011434e-07, "loss": 1.2015, "step": 28136 }, { "epoch": 0.85, "learning_rate": 2.98298197336542e-07, "loss": 1.0731, "step": 28137 }, { "epoch": 0.85, "learning_rate": 2.9818266037211e-07, "loss": 1.0999, "step": 28138 }, { "epoch": 0.85, "learning_rate": 2.980671443679184e-07, "loss": 1.0555, "step": 28139 }, { "epoch": 0.85, "learning_rate": 2.9795164932506725e-07, "loss": 1.0602, "step": 28140 }, { "epoch": 0.85, "learning_rate": 2.9783617524465596e-07, "loss": 1.0909, "step": 28141 }, { "epoch": 0.85, "learning_rate": 2.977207221277839e-07, "loss": 1.2069, "step": 28142 }, { "epoch": 0.85, "learning_rate": 2.9760528997554964e-07, "loss": 1.1588, "step": 28143 }, { "epoch": 0.85, "learning_rate": 2.9748987878905236e-07, "loss": 1.1381, "step": 28144 }, { "epoch": 0.85, "learning_rate": 2.9737448856939047e-07, "loss": 1.0516, "step": 28145 }, { "epoch": 0.85, "learning_rate": 2.972591193176627e-07, "loss": 1.1454, "step": 28146 }, { "epoch": 0.85, "learning_rate": 2.9714377103496726e-07, "loss": 1.1255, "step": 28147 }, { "epoch": 0.85, "learning_rate": 2.970284437224022e-07, "loss": 1.0588, "step": 28148 }, { "epoch": 0.85, "learning_rate": 2.969131373810652e-07, "loss": 1.1084, "step": 28149 }, { "epoch": 0.85, "learning_rate": 2.9679785201205487e-07, "loss": 1.0369, "step": 28150 }, { "epoch": 0.85, "learning_rate": 2.9668258761646724e-07, "loss": 1.1824, "step": 28151 }, { "epoch": 0.85, "learning_rate": 2.9656734419540035e-07, "loss": 1.0947, "step": 28152 }, { "epoch": 0.85, "learning_rate": 2.964521217499508e-07, "loss": 1.0737, "step": 28153 }, { "epoch": 0.85, "learning_rate": 2.9633692028121665e-07, "loss": 1.1717, "step": 28154 }, { "epoch": 0.85, "learning_rate": 2.9622173979029307e-07, "loss": 1.2395, "step": 28155 }, { "epoch": 0.85, "learning_rate": 2.96106580278277e-07, "loss": 1.0382, "step": 28156 }, { "epoch": 0.85, "learning_rate": 2.95991441746265e-07, "loss": 1.1346, "step": 28157 }, { "epoch": 0.85, "learning_rate": 2.9587632419535357e-07, "loss": 1.2074, "step": 28158 }, { "epoch": 0.85, "learning_rate": 2.957612276266375e-07, "loss": 1.0839, "step": 28159 }, { "epoch": 0.85, "learning_rate": 2.9564615204121265e-07, "loss": 1.1218, "step": 28160 }, { "epoch": 0.85, "learning_rate": 2.9553109744017513e-07, "loss": 1.1387, "step": 28161 }, { "epoch": 0.85, "learning_rate": 2.954160638246195e-07, "loss": 1.0483, "step": 28162 }, { "epoch": 0.85, "learning_rate": 2.9530105119564196e-07, "loss": 0.9904, "step": 28163 }, { "epoch": 0.85, "learning_rate": 2.95186059554336e-07, "loss": 1.1125, "step": 28164 }, { "epoch": 0.85, "learning_rate": 2.9507108890179684e-07, "loss": 1.0452, "step": 28165 }, { "epoch": 0.85, "learning_rate": 2.94956139239119e-07, "loss": 1.1174, "step": 28166 }, { "epoch": 0.85, "learning_rate": 2.948412105673973e-07, "loss": 1.0324, "step": 28167 }, { "epoch": 0.85, "learning_rate": 2.947263028877248e-07, "loss": 1.2671, "step": 28168 }, { "epoch": 0.85, "learning_rate": 2.9461141620119565e-07, "loss": 0.9808, "step": 28169 }, { "epoch": 0.85, "learning_rate": 2.9449655050890367e-07, "loss": 1.1611, "step": 28170 }, { "epoch": 0.85, "learning_rate": 2.943817058119425e-07, "loss": 1.0605, "step": 28171 }, { "epoch": 0.85, "learning_rate": 2.94266882111405e-07, "loss": 1.1025, "step": 28172 }, { "epoch": 0.85, "learning_rate": 2.9415207940838465e-07, "loss": 1.1418, "step": 28173 }, { "epoch": 0.85, "learning_rate": 2.940372977039738e-07, "loss": 1.1409, "step": 28174 }, { "epoch": 0.85, "learning_rate": 2.939225369992657e-07, "loss": 1.0959, "step": 28175 }, { "epoch": 0.85, "learning_rate": 2.938077972953532e-07, "loss": 1.0675, "step": 28176 }, { "epoch": 0.85, "learning_rate": 2.936930785933273e-07, "loss": 1.0073, "step": 28177 }, { "epoch": 0.85, "learning_rate": 2.9357838089428046e-07, "loss": 1.0732, "step": 28178 }, { "epoch": 0.85, "learning_rate": 2.934637041993052e-07, "loss": 1.1065, "step": 28179 }, { "epoch": 0.85, "learning_rate": 2.933490485094931e-07, "loss": 1.2239, "step": 28180 }, { "epoch": 0.85, "learning_rate": 2.9323441382593463e-07, "loss": 1.1542, "step": 28181 }, { "epoch": 0.85, "learning_rate": 2.931198001497218e-07, "loss": 1.0036, "step": 28182 }, { "epoch": 0.85, "learning_rate": 2.930052074819459e-07, "loss": 1.0504, "step": 28183 }, { "epoch": 0.85, "learning_rate": 2.928906358236977e-07, "loss": 1.0989, "step": 28184 }, { "epoch": 0.85, "learning_rate": 2.927760851760672e-07, "loss": 1.0188, "step": 28185 }, { "epoch": 0.85, "learning_rate": 2.9266155554014545e-07, "loss": 0.9976, "step": 28186 }, { "epoch": 0.85, "learning_rate": 2.9254704691702247e-07, "loss": 1.1287, "step": 28187 }, { "epoch": 0.85, "learning_rate": 2.924325593077884e-07, "loss": 1.0016, "step": 28188 }, { "epoch": 0.85, "learning_rate": 2.9231809271353386e-07, "loss": 1.1458, "step": 28189 }, { "epoch": 0.85, "learning_rate": 2.922036471353473e-07, "loss": 1.0774, "step": 28190 }, { "epoch": 0.85, "learning_rate": 2.9208922257431857e-07, "loss": 1.0683, "step": 28191 }, { "epoch": 0.85, "learning_rate": 2.919748190315372e-07, "loss": 1.0134, "step": 28192 }, { "epoch": 0.85, "learning_rate": 2.918604365080927e-07, "loss": 1.1623, "step": 28193 }, { "epoch": 0.85, "learning_rate": 2.9174607500507267e-07, "loss": 1.1942, "step": 28194 }, { "epoch": 0.85, "learning_rate": 2.9163173452356643e-07, "loss": 1.1013, "step": 28195 }, { "epoch": 0.85, "learning_rate": 2.915174150646627e-07, "loss": 1.1118, "step": 28196 }, { "epoch": 0.85, "learning_rate": 2.9140311662944924e-07, "loss": 1.1407, "step": 28197 }, { "epoch": 0.85, "learning_rate": 2.912888392190147e-07, "loss": 1.0782, "step": 28198 }, { "epoch": 0.85, "learning_rate": 2.911745828344467e-07, "loss": 1.1509, "step": 28199 }, { "epoch": 0.85, "learning_rate": 2.9106034747683254e-07, "loss": 1.2404, "step": 28200 }, { "epoch": 0.85, "learning_rate": 2.9094613314726043e-07, "loss": 1.0649, "step": 28201 }, { "epoch": 0.85, "learning_rate": 2.9083193984681733e-07, "loss": 1.0929, "step": 28202 }, { "epoch": 0.85, "learning_rate": 2.907177675765899e-07, "loss": 1.1238, "step": 28203 }, { "epoch": 0.85, "learning_rate": 2.906036163376652e-07, "loss": 1.027, "step": 28204 }, { "epoch": 0.85, "learning_rate": 2.9048948613113027e-07, "loss": 1.1071, "step": 28205 }, { "epoch": 0.85, "learning_rate": 2.903753769580714e-07, "loss": 1.1077, "step": 28206 }, { "epoch": 0.85, "learning_rate": 2.902612888195744e-07, "loss": 1.0928, "step": 28207 }, { "epoch": 0.85, "learning_rate": 2.901472217167259e-07, "loss": 1.0523, "step": 28208 }, { "epoch": 0.85, "learning_rate": 2.9003317565061113e-07, "loss": 1.0087, "step": 28209 }, { "epoch": 0.85, "learning_rate": 2.89919150622317e-07, "loss": 1.1761, "step": 28210 }, { "epoch": 0.85, "learning_rate": 2.898051466329274e-07, "loss": 1.1418, "step": 28211 }, { "epoch": 0.85, "learning_rate": 2.896911636835287e-07, "loss": 0.9873, "step": 28212 }, { "epoch": 0.85, "learning_rate": 2.8957720177520523e-07, "loss": 1.0245, "step": 28213 }, { "epoch": 0.85, "learning_rate": 2.8946326090904255e-07, "loss": 1.2134, "step": 28214 }, { "epoch": 0.85, "learning_rate": 2.8934934108612533e-07, "loss": 1.0551, "step": 28215 }, { "epoch": 0.85, "learning_rate": 2.892354423075369e-07, "loss": 1.0933, "step": 28216 }, { "epoch": 0.85, "learning_rate": 2.891215645743628e-07, "loss": 1.2004, "step": 28217 }, { "epoch": 0.85, "learning_rate": 2.890077078876863e-07, "loss": 1.2139, "step": 28218 }, { "epoch": 0.85, "learning_rate": 2.888938722485923e-07, "loss": 1.0839, "step": 28219 }, { "epoch": 0.85, "learning_rate": 2.8878005765816315e-07, "loss": 1.1042, "step": 28220 }, { "epoch": 0.85, "learning_rate": 2.8866626411748284e-07, "loss": 1.1448, "step": 28221 }, { "epoch": 0.85, "learning_rate": 2.885524916276347e-07, "loss": 1.025, "step": 28222 }, { "epoch": 0.85, "learning_rate": 2.884387401897018e-07, "loss": 1.0132, "step": 28223 }, { "epoch": 0.85, "learning_rate": 2.883250098047674e-07, "loss": 1.1605, "step": 28224 }, { "epoch": 0.85, "learning_rate": 2.8821130047391315e-07, "loss": 1.0558, "step": 28225 }, { "epoch": 0.85, "learning_rate": 2.8809761219822234e-07, "loss": 1.1545, "step": 28226 }, { "epoch": 0.85, "learning_rate": 2.879839449787766e-07, "loss": 1.0895, "step": 28227 }, { "epoch": 0.85, "learning_rate": 2.8787029881665873e-07, "loss": 1.1053, "step": 28228 }, { "epoch": 0.85, "learning_rate": 2.8775667371295e-07, "loss": 1.1146, "step": 28229 }, { "epoch": 0.85, "learning_rate": 2.876430696687324e-07, "loss": 1.1732, "step": 28230 }, { "epoch": 0.85, "learning_rate": 2.8752948668508726e-07, "loss": 1.0701, "step": 28231 }, { "epoch": 0.85, "learning_rate": 2.8741592476309616e-07, "loss": 1.0735, "step": 28232 }, { "epoch": 0.85, "learning_rate": 2.873023839038397e-07, "loss": 1.0452, "step": 28233 }, { "epoch": 0.85, "learning_rate": 2.8718886410839865e-07, "loss": 1.053, "step": 28234 }, { "epoch": 0.85, "learning_rate": 2.870753653778538e-07, "loss": 1.1575, "step": 28235 }, { "epoch": 0.85, "learning_rate": 2.8696188771328627e-07, "loss": 1.162, "step": 28236 }, { "epoch": 0.85, "learning_rate": 2.868484311157754e-07, "loss": 1.1573, "step": 28237 }, { "epoch": 0.85, "learning_rate": 2.8673499558640127e-07, "loss": 1.0412, "step": 28238 }, { "epoch": 0.85, "learning_rate": 2.866215811262443e-07, "loss": 1.0794, "step": 28239 }, { "epoch": 0.85, "learning_rate": 2.8650818773638374e-07, "loss": 1.1053, "step": 28240 }, { "epoch": 0.85, "learning_rate": 2.863948154178997e-07, "loss": 1.1133, "step": 28241 }, { "epoch": 0.85, "learning_rate": 2.8628146417187057e-07, "loss": 1.2199, "step": 28242 }, { "epoch": 0.85, "learning_rate": 2.861681339993755e-07, "loss": 1.0455, "step": 28243 }, { "epoch": 0.85, "learning_rate": 2.8605482490149354e-07, "loss": 1.0856, "step": 28244 }, { "epoch": 0.85, "learning_rate": 2.859415368793042e-07, "loss": 0.9975, "step": 28245 }, { "epoch": 0.85, "learning_rate": 2.8582826993388435e-07, "loss": 1.0355, "step": 28246 }, { "epoch": 0.85, "learning_rate": 2.8571502406631315e-07, "loss": 1.0546, "step": 28247 }, { "epoch": 0.85, "learning_rate": 2.856017992776683e-07, "loss": 1.1739, "step": 28248 }, { "epoch": 0.85, "learning_rate": 2.854885955690284e-07, "loss": 1.1338, "step": 28249 }, { "epoch": 0.85, "learning_rate": 2.853754129414699e-07, "loss": 1.0829, "step": 28250 }, { "epoch": 0.85, "learning_rate": 2.852622513960709e-07, "loss": 1.0977, "step": 28251 }, { "epoch": 0.85, "learning_rate": 2.8514911093390886e-07, "loss": 1.0366, "step": 28252 }, { "epoch": 0.85, "learning_rate": 2.850359915560605e-07, "loss": 0.9763, "step": 28253 }, { "epoch": 0.85, "learning_rate": 2.8492289326360253e-07, "loss": 1.0554, "step": 28254 }, { "epoch": 0.85, "learning_rate": 2.848098160576121e-07, "loss": 1.1567, "step": 28255 }, { "epoch": 0.85, "learning_rate": 2.846967599391651e-07, "loss": 1.0314, "step": 28256 }, { "epoch": 0.85, "learning_rate": 2.845837249093381e-07, "loss": 1.0826, "step": 28257 }, { "epoch": 0.85, "learning_rate": 2.844707109692077e-07, "loss": 1.1068, "step": 28258 }, { "epoch": 0.85, "learning_rate": 2.843577181198484e-07, "loss": 1.0549, "step": 28259 }, { "epoch": 0.85, "learning_rate": 2.842447463623366e-07, "loss": 1.1876, "step": 28260 }, { "epoch": 0.85, "learning_rate": 2.8413179569774767e-07, "loss": 1.2665, "step": 28261 }, { "epoch": 0.85, "learning_rate": 2.840188661271573e-07, "loss": 1.2118, "step": 28262 }, { "epoch": 0.85, "learning_rate": 2.8390595765163955e-07, "loss": 1.1055, "step": 28263 }, { "epoch": 0.85, "learning_rate": 2.8379307027226995e-07, "loss": 1.1274, "step": 28264 }, { "epoch": 0.85, "learning_rate": 2.8368020399012265e-07, "loss": 1.1735, "step": 28265 }, { "epoch": 0.85, "learning_rate": 2.835673588062726e-07, "loss": 1.1011, "step": 28266 }, { "epoch": 0.85, "learning_rate": 2.834545347217943e-07, "loss": 1.1335, "step": 28267 }, { "epoch": 0.85, "learning_rate": 2.8334173173776096e-07, "loss": 1.0361, "step": 28268 }, { "epoch": 0.85, "learning_rate": 2.832289498552465e-07, "loss": 1.0476, "step": 28269 }, { "epoch": 0.85, "learning_rate": 2.831161890753248e-07, "loss": 1.1401, "step": 28270 }, { "epoch": 0.85, "learning_rate": 2.8300344939906994e-07, "loss": 1.096, "step": 28271 }, { "epoch": 0.85, "learning_rate": 2.828907308275541e-07, "loss": 1.0413, "step": 28272 }, { "epoch": 0.85, "learning_rate": 2.8277803336185047e-07, "loss": 1.1895, "step": 28273 }, { "epoch": 0.85, "learning_rate": 2.8266535700303213e-07, "loss": 1.0902, "step": 28274 }, { "epoch": 0.85, "learning_rate": 2.825527017521723e-07, "loss": 1.1017, "step": 28275 }, { "epoch": 0.85, "learning_rate": 2.8244006761034225e-07, "loss": 1.0261, "step": 28276 }, { "epoch": 0.85, "learning_rate": 2.8232745457861476e-07, "loss": 1.074, "step": 28277 }, { "epoch": 0.85, "learning_rate": 2.82214862658062e-07, "loss": 1.1012, "step": 28278 }, { "epoch": 0.85, "learning_rate": 2.821022918497554e-07, "loss": 1.0415, "step": 28279 }, { "epoch": 0.85, "learning_rate": 2.819897421547668e-07, "loss": 1.0534, "step": 28280 }, { "epoch": 0.85, "learning_rate": 2.818772135741676e-07, "loss": 1.185, "step": 28281 }, { "epoch": 0.85, "learning_rate": 2.817647061090292e-07, "loss": 1.1118, "step": 28282 }, { "epoch": 0.85, "learning_rate": 2.816522197604224e-07, "loss": 1.051, "step": 28283 }, { "epoch": 0.85, "learning_rate": 2.815397545294185e-07, "loss": 1.0241, "step": 28284 }, { "epoch": 0.85, "learning_rate": 2.8142731041708726e-07, "loss": 1.0942, "step": 28285 }, { "epoch": 0.85, "learning_rate": 2.8131488742449947e-07, "loss": 1.1871, "step": 28286 }, { "epoch": 0.85, "learning_rate": 2.812024855527254e-07, "loss": 1.1389, "step": 28287 }, { "epoch": 0.85, "learning_rate": 2.810901048028358e-07, "loss": 1.0977, "step": 28288 }, { "epoch": 0.85, "learning_rate": 2.809777451758988e-07, "loss": 1.0775, "step": 28289 }, { "epoch": 0.85, "learning_rate": 2.808654066729855e-07, "loss": 1.108, "step": 28290 }, { "epoch": 0.85, "learning_rate": 2.807530892951643e-07, "loss": 1.1036, "step": 28291 }, { "epoch": 0.85, "learning_rate": 2.8064079304350485e-07, "loss": 1.0631, "step": 28292 }, { "epoch": 0.85, "learning_rate": 2.8052851791907697e-07, "loss": 0.9991, "step": 28293 }, { "epoch": 0.85, "learning_rate": 2.8041626392294797e-07, "loss": 1.0722, "step": 28294 }, { "epoch": 0.85, "learning_rate": 2.803040310561872e-07, "loss": 1.1161, "step": 28295 }, { "epoch": 0.85, "learning_rate": 2.80191819319863e-07, "loss": 1.0817, "step": 28296 }, { "epoch": 0.85, "learning_rate": 2.8007962871504423e-07, "loss": 1.0039, "step": 28297 }, { "epoch": 0.85, "learning_rate": 2.799674592427976e-07, "loss": 1.1117, "step": 28298 }, { "epoch": 0.85, "learning_rate": 2.798553109041915e-07, "loss": 1.136, "step": 28299 }, { "epoch": 0.85, "learning_rate": 2.797431837002937e-07, "loss": 1.0126, "step": 28300 }, { "epoch": 0.85, "learning_rate": 2.796310776321717e-07, "loss": 1.1445, "step": 28301 }, { "epoch": 0.85, "learning_rate": 2.7951899270089234e-07, "loss": 1.1525, "step": 28302 }, { "epoch": 0.85, "learning_rate": 2.794069289075224e-07, "loss": 1.066, "step": 28303 }, { "epoch": 0.85, "learning_rate": 2.7929488625312944e-07, "loss": 1.1451, "step": 28304 }, { "epoch": 0.85, "learning_rate": 2.791828647387793e-07, "loss": 1.2478, "step": 28305 }, { "epoch": 0.85, "learning_rate": 2.790708643655393e-07, "loss": 1.1725, "step": 28306 }, { "epoch": 0.85, "learning_rate": 2.789588851344746e-07, "loss": 1.0969, "step": 28307 }, { "epoch": 0.85, "learning_rate": 2.788469270466515e-07, "loss": 1.1281, "step": 28308 }, { "epoch": 0.85, "learning_rate": 2.787349901031361e-07, "loss": 1.1357, "step": 28309 }, { "epoch": 0.85, "learning_rate": 2.786230743049936e-07, "loss": 1.1242, "step": 28310 }, { "epoch": 0.85, "learning_rate": 2.785111796532897e-07, "loss": 1.2654, "step": 28311 }, { "epoch": 0.85, "learning_rate": 2.783993061490894e-07, "loss": 1.1215, "step": 28312 }, { "epoch": 0.85, "learning_rate": 2.7828745379345797e-07, "loss": 1.0851, "step": 28313 }, { "epoch": 0.85, "learning_rate": 2.7817562258746014e-07, "loss": 1.261, "step": 28314 }, { "epoch": 0.85, "learning_rate": 2.7806381253216e-07, "loss": 1.0957, "step": 28315 }, { "epoch": 0.85, "learning_rate": 2.7795202362862233e-07, "loss": 1.1107, "step": 28316 }, { "epoch": 0.85, "learning_rate": 2.778402558779109e-07, "loss": 1.084, "step": 28317 }, { "epoch": 0.85, "learning_rate": 2.7772850928109024e-07, "loss": 1.0944, "step": 28318 }, { "epoch": 0.85, "learning_rate": 2.7761678383922436e-07, "loss": 0.9783, "step": 28319 }, { "epoch": 0.85, "learning_rate": 2.77505079553376e-07, "loss": 1.1199, "step": 28320 }, { "epoch": 0.85, "learning_rate": 2.773933964246087e-07, "loss": 1.1178, "step": 28321 }, { "epoch": 0.85, "learning_rate": 2.772817344539858e-07, "loss": 1.0913, "step": 28322 }, { "epoch": 0.85, "learning_rate": 2.7717009364257085e-07, "loss": 1.2252, "step": 28323 }, { "epoch": 0.85, "learning_rate": 2.770584739914256e-07, "loss": 1.1898, "step": 28324 }, { "epoch": 0.85, "learning_rate": 2.76946875501613e-07, "loss": 1.1826, "step": 28325 }, { "epoch": 0.85, "learning_rate": 2.7683529817419537e-07, "loss": 1.0711, "step": 28326 }, { "epoch": 0.85, "learning_rate": 2.767237420102356e-07, "loss": 1.1523, "step": 28327 }, { "epoch": 0.85, "learning_rate": 2.766122070107946e-07, "loss": 1.1443, "step": 28328 }, { "epoch": 0.85, "learning_rate": 2.765006931769346e-07, "loss": 1.1931, "step": 28329 }, { "epoch": 0.85, "learning_rate": 2.763892005097171e-07, "loss": 1.0569, "step": 28330 }, { "epoch": 0.85, "learning_rate": 2.7627772901020394e-07, "loss": 1.0515, "step": 28331 }, { "epoch": 0.85, "learning_rate": 2.761662786794553e-07, "loss": 1.1401, "step": 28332 }, { "epoch": 0.85, "learning_rate": 2.7605484951853277e-07, "loss": 1.0821, "step": 28333 }, { "epoch": 0.85, "learning_rate": 2.7594344152849674e-07, "loss": 1.0034, "step": 28334 }, { "epoch": 0.85, "learning_rate": 2.758320547104082e-07, "loss": 1.0344, "step": 28335 }, { "epoch": 0.85, "learning_rate": 2.757206890653272e-07, "loss": 1.1744, "step": 28336 }, { "epoch": 0.85, "learning_rate": 2.7560934459431423e-07, "loss": 1.0428, "step": 28337 }, { "epoch": 0.85, "learning_rate": 2.7549802129842873e-07, "loss": 1.135, "step": 28338 }, { "epoch": 0.85, "learning_rate": 2.753867191787307e-07, "loss": 1.0084, "step": 28339 }, { "epoch": 0.85, "learning_rate": 2.7527543823628046e-07, "loss": 1.1442, "step": 28340 }, { "epoch": 0.85, "learning_rate": 2.7516417847213595e-07, "loss": 1.0473, "step": 28341 }, { "epoch": 0.85, "learning_rate": 2.7505293988735694e-07, "loss": 1.079, "step": 28342 }, { "epoch": 0.85, "learning_rate": 2.7494172248300227e-07, "loss": 1.1132, "step": 28343 }, { "epoch": 0.85, "learning_rate": 2.748305262601314e-07, "loss": 1.0717, "step": 28344 }, { "epoch": 0.85, "learning_rate": 2.7471935121980155e-07, "loss": 1.1098, "step": 28345 }, { "epoch": 0.85, "learning_rate": 2.746081973630718e-07, "loss": 1.1589, "step": 28346 }, { "epoch": 0.85, "learning_rate": 2.744970646910003e-07, "loss": 1.0566, "step": 28347 }, { "epoch": 0.85, "learning_rate": 2.74385953204645e-07, "loss": 1.0986, "step": 28348 }, { "epoch": 0.85, "learning_rate": 2.74274862905064e-07, "loss": 1.0492, "step": 28349 }, { "epoch": 0.85, "learning_rate": 2.7416379379331365e-07, "loss": 1.0141, "step": 28350 }, { "epoch": 0.85, "learning_rate": 2.740527458704523e-07, "loss": 1.1201, "step": 28351 }, { "epoch": 0.85, "learning_rate": 2.739417191375365e-07, "loss": 1.1504, "step": 28352 }, { "epoch": 0.85, "learning_rate": 2.738307135956242e-07, "loss": 1.0784, "step": 28353 }, { "epoch": 0.85, "learning_rate": 2.737197292457705e-07, "loss": 1.0444, "step": 28354 }, { "epoch": 0.85, "learning_rate": 2.7360876608903295e-07, "loss": 1.1512, "step": 28355 }, { "epoch": 0.85, "learning_rate": 2.734978241264677e-07, "loss": 1.045, "step": 28356 }, { "epoch": 0.85, "learning_rate": 2.733869033591313e-07, "loss": 1.0175, "step": 28357 }, { "epoch": 0.85, "learning_rate": 2.7327600378807885e-07, "loss": 1.192, "step": 28358 }, { "epoch": 0.85, "learning_rate": 2.731651254143661e-07, "loss": 1.069, "step": 28359 }, { "epoch": 0.85, "learning_rate": 2.730542682390491e-07, "loss": 1.0858, "step": 28360 }, { "epoch": 0.85, "learning_rate": 2.72943432263183e-07, "loss": 1.1276, "step": 28361 }, { "epoch": 0.85, "learning_rate": 2.7283261748782264e-07, "loss": 1.067, "step": 28362 }, { "epoch": 0.85, "learning_rate": 2.7272182391402305e-07, "loss": 1.1323, "step": 28363 }, { "epoch": 0.85, "learning_rate": 2.726110515428393e-07, "loss": 1.0769, "step": 28364 }, { "epoch": 0.85, "learning_rate": 2.7250030037532545e-07, "loss": 1.0825, "step": 28365 }, { "epoch": 0.85, "learning_rate": 2.723895704125365e-07, "loss": 1.0468, "step": 28366 }, { "epoch": 0.85, "learning_rate": 2.7227886165552525e-07, "loss": 1.1868, "step": 28367 }, { "epoch": 0.85, "learning_rate": 2.721681741053467e-07, "loss": 1.0109, "step": 28368 }, { "epoch": 0.85, "learning_rate": 2.7205750776305384e-07, "loss": 1.13, "step": 28369 }, { "epoch": 0.85, "learning_rate": 2.719468626297012e-07, "loss": 1.1919, "step": 28370 }, { "epoch": 0.85, "learning_rate": 2.7183623870634087e-07, "loss": 1.0938, "step": 28371 }, { "epoch": 0.85, "learning_rate": 2.7172563599402626e-07, "loss": 1.1022, "step": 28372 }, { "epoch": 0.85, "learning_rate": 2.716150544938106e-07, "loss": 1.0262, "step": 28373 }, { "epoch": 0.85, "learning_rate": 2.715044942067463e-07, "loss": 1.1057, "step": 28374 }, { "epoch": 0.85, "learning_rate": 2.713939551338865e-07, "loss": 1.0918, "step": 28375 }, { "epoch": 0.85, "learning_rate": 2.712834372762821e-07, "loss": 1.1102, "step": 28376 }, { "epoch": 0.85, "learning_rate": 2.711729406349864e-07, "loss": 1.0894, "step": 28377 }, { "epoch": 0.85, "learning_rate": 2.710624652110508e-07, "loss": 1.039, "step": 28378 }, { "epoch": 0.85, "learning_rate": 2.709520110055272e-07, "loss": 1.0624, "step": 28379 }, { "epoch": 0.85, "learning_rate": 2.7084157801946674e-07, "loss": 1.0626, "step": 28380 }, { "epoch": 0.85, "learning_rate": 2.707311662539208e-07, "loss": 1.1609, "step": 28381 }, { "epoch": 0.86, "learning_rate": 2.706207757099405e-07, "loss": 1.1234, "step": 28382 }, { "epoch": 0.86, "learning_rate": 2.7051040638857715e-07, "loss": 1.1, "step": 28383 }, { "epoch": 0.86, "learning_rate": 2.704000582908806e-07, "loss": 1.1439, "step": 28384 }, { "epoch": 0.86, "learning_rate": 2.702897314179015e-07, "loss": 1.2351, "step": 28385 }, { "epoch": 0.86, "learning_rate": 2.701794257706905e-07, "loss": 1.1774, "step": 28386 }, { "epoch": 0.86, "learning_rate": 2.7006914135029735e-07, "loss": 1.1166, "step": 28387 }, { "epoch": 0.86, "learning_rate": 2.6995887815777193e-07, "loss": 1.112, "step": 28388 }, { "epoch": 0.86, "learning_rate": 2.6984863619416433e-07, "loss": 1.1216, "step": 28389 }, { "epoch": 0.86, "learning_rate": 2.6973841546052345e-07, "loss": 1.2246, "step": 28390 }, { "epoch": 0.86, "learning_rate": 2.696282159578986e-07, "loss": 1.1037, "step": 28391 }, { "epoch": 0.86, "learning_rate": 2.695180376873391e-07, "loss": 1.1114, "step": 28392 }, { "epoch": 0.86, "learning_rate": 2.694078806498934e-07, "loss": 1.1157, "step": 28393 }, { "epoch": 0.86, "learning_rate": 2.692977448466105e-07, "loss": 1.0534, "step": 28394 }, { "epoch": 0.86, "learning_rate": 2.691876302785387e-07, "loss": 1.0154, "step": 28395 }, { "epoch": 0.86, "learning_rate": 2.690775369467266e-07, "loss": 1.1304, "step": 28396 }, { "epoch": 0.86, "learning_rate": 2.689674648522217e-07, "loss": 1.0597, "step": 28397 }, { "epoch": 0.86, "learning_rate": 2.68857413996072e-07, "loss": 1.0219, "step": 28398 }, { "epoch": 0.86, "learning_rate": 2.687473843793251e-07, "loss": 1.1352, "step": 28399 }, { "epoch": 0.86, "learning_rate": 2.6863737600302837e-07, "loss": 1.075, "step": 28400 }, { "epoch": 0.86, "learning_rate": 2.6852738886822967e-07, "loss": 0.9876, "step": 28401 }, { "epoch": 0.86, "learning_rate": 2.6841742297597506e-07, "loss": 1.0868, "step": 28402 }, { "epoch": 0.86, "learning_rate": 2.683074783273118e-07, "loss": 1.0755, "step": 28403 }, { "epoch": 0.86, "learning_rate": 2.681975549232865e-07, "loss": 1.137, "step": 28404 }, { "epoch": 0.86, "learning_rate": 2.680876527649465e-07, "loss": 1.1743, "step": 28405 }, { "epoch": 0.86, "learning_rate": 2.6797777185333605e-07, "loss": 1.0547, "step": 28406 }, { "epoch": 0.86, "learning_rate": 2.678679121895025e-07, "loss": 1.1589, "step": 28407 }, { "epoch": 0.86, "learning_rate": 2.677580737744914e-07, "loss": 1.212, "step": 28408 }, { "epoch": 0.86, "learning_rate": 2.6764825660934885e-07, "loss": 1.0698, "step": 28409 }, { "epoch": 0.86, "learning_rate": 2.6753846069511923e-07, "loss": 1.0972, "step": 28410 }, { "epoch": 0.86, "learning_rate": 2.674286860328484e-07, "loss": 1.2137, "step": 28411 }, { "epoch": 0.86, "learning_rate": 2.673189326235812e-07, "loss": 1.1067, "step": 28412 }, { "epoch": 0.86, "learning_rate": 2.6720920046836213e-07, "loss": 1.213, "step": 28413 }, { "epoch": 0.86, "learning_rate": 2.6709948956823687e-07, "loss": 1.0931, "step": 28414 }, { "epoch": 0.86, "learning_rate": 2.669897999242488e-07, "loss": 1.1169, "step": 28415 }, { "epoch": 0.86, "learning_rate": 2.6688013153744195e-07, "loss": 1.1487, "step": 28416 }, { "epoch": 0.86, "learning_rate": 2.667704844088609e-07, "loss": 1.0715, "step": 28417 }, { "epoch": 0.86, "learning_rate": 2.666608585395494e-07, "loss": 1.1854, "step": 28418 }, { "epoch": 0.86, "learning_rate": 2.6655125393055093e-07, "loss": 1.0474, "step": 28419 }, { "epoch": 0.86, "learning_rate": 2.664416705829087e-07, "loss": 1.1061, "step": 28420 }, { "epoch": 0.86, "learning_rate": 2.663321084976661e-07, "loss": 1.0587, "step": 28421 }, { "epoch": 0.86, "learning_rate": 2.6622256767586644e-07, "loss": 1.0261, "step": 28422 }, { "epoch": 0.86, "learning_rate": 2.66113048118552e-07, "loss": 1.1084, "step": 28423 }, { "epoch": 0.86, "learning_rate": 2.660035498267652e-07, "loss": 1.0898, "step": 28424 }, { "epoch": 0.86, "learning_rate": 2.6589407280154856e-07, "loss": 1.1225, "step": 28425 }, { "epoch": 0.86, "learning_rate": 2.657846170439446e-07, "loss": 1.1242, "step": 28426 }, { "epoch": 0.86, "learning_rate": 2.6567518255499523e-07, "loss": 1.0891, "step": 28427 }, { "epoch": 0.86, "learning_rate": 2.655657693357419e-07, "loss": 1.1036, "step": 28428 }, { "epoch": 0.86, "learning_rate": 2.6545637738722596e-07, "loss": 1.1605, "step": 28429 }, { "epoch": 0.86, "learning_rate": 2.6534700671048935e-07, "loss": 1.1243, "step": 28430 }, { "epoch": 0.86, "learning_rate": 2.6523765730657345e-07, "loss": 1.1282, "step": 28431 }, { "epoch": 0.86, "learning_rate": 2.651283291765183e-07, "loss": 1.1268, "step": 28432 }, { "epoch": 0.86, "learning_rate": 2.65019022321365e-07, "loss": 1.1452, "step": 28433 }, { "epoch": 0.86, "learning_rate": 2.649097367421544e-07, "loss": 1.0417, "step": 28434 }, { "epoch": 0.86, "learning_rate": 2.6480047243992695e-07, "loss": 0.9905, "step": 28435 }, { "epoch": 0.86, "learning_rate": 2.6469122941572195e-07, "loss": 1.0593, "step": 28436 }, { "epoch": 0.86, "learning_rate": 2.645820076705799e-07, "loss": 1.2992, "step": 28437 }, { "epoch": 0.86, "learning_rate": 2.644728072055408e-07, "loss": 1.0358, "step": 28438 }, { "epoch": 0.86, "learning_rate": 2.6436362802164354e-07, "loss": 1.075, "step": 28439 }, { "epoch": 0.86, "learning_rate": 2.6425447011992845e-07, "loss": 1.1323, "step": 28440 }, { "epoch": 0.86, "learning_rate": 2.6414533350143377e-07, "loss": 1.0972, "step": 28441 }, { "epoch": 0.86, "learning_rate": 2.640362181671985e-07, "loss": 1.1071, "step": 28442 }, { "epoch": 0.86, "learning_rate": 2.639271241182614e-07, "loss": 1.0605, "step": 28443 }, { "epoch": 0.86, "learning_rate": 2.6381805135566126e-07, "loss": 1.0877, "step": 28444 }, { "epoch": 0.86, "learning_rate": 2.6370899988043653e-07, "loss": 1.1071, "step": 28445 }, { "epoch": 0.86, "learning_rate": 2.635999696936248e-07, "loss": 1.0847, "step": 28446 }, { "epoch": 0.86, "learning_rate": 2.6349096079626436e-07, "loss": 1.1149, "step": 28447 }, { "epoch": 0.86, "learning_rate": 2.633819731893933e-07, "loss": 1.1225, "step": 28448 }, { "epoch": 0.86, "learning_rate": 2.6327300687404827e-07, "loss": 1.1699, "step": 28449 }, { "epoch": 0.86, "learning_rate": 2.631640618512668e-07, "loss": 1.1726, "step": 28450 }, { "epoch": 0.86, "learning_rate": 2.6305513812208637e-07, "loss": 1.1536, "step": 28451 }, { "epoch": 0.86, "learning_rate": 2.6294623568754343e-07, "loss": 1.1075, "step": 28452 }, { "epoch": 0.86, "learning_rate": 2.628373545486756e-07, "loss": 1.1112, "step": 28453 }, { "epoch": 0.86, "learning_rate": 2.6272849470651814e-07, "loss": 1.1683, "step": 28454 }, { "epoch": 0.86, "learning_rate": 2.6261965616210805e-07, "loss": 1.1627, "step": 28455 }, { "epoch": 0.86, "learning_rate": 2.62510838916481e-07, "loss": 1.1482, "step": 28456 }, { "epoch": 0.86, "learning_rate": 2.624020429706739e-07, "loss": 1.0137, "step": 28457 }, { "epoch": 0.86, "learning_rate": 2.6229326832572096e-07, "loss": 1.0238, "step": 28458 }, { "epoch": 0.86, "learning_rate": 2.621845149826585e-07, "loss": 1.1207, "step": 28459 }, { "epoch": 0.86, "learning_rate": 2.620757829425216e-07, "loss": 1.1182, "step": 28460 }, { "epoch": 0.86, "learning_rate": 2.619670722063461e-07, "loss": 1.0438, "step": 28461 }, { "epoch": 0.86, "learning_rate": 2.618583827751656e-07, "loss": 1.1637, "step": 28462 }, { "epoch": 0.86, "learning_rate": 2.6174971465001556e-07, "loss": 1.1274, "step": 28463 }, { "epoch": 0.86, "learning_rate": 2.6164106783193004e-07, "loss": 1.1376, "step": 28464 }, { "epoch": 0.86, "learning_rate": 2.615324423219434e-07, "loss": 1.0325, "step": 28465 }, { "epoch": 0.86, "learning_rate": 2.614238381210907e-07, "loss": 1.0216, "step": 28466 }, { "epoch": 0.86, "learning_rate": 2.613152552304041e-07, "loss": 1.1293, "step": 28467 }, { "epoch": 0.86, "learning_rate": 2.612066936509183e-07, "loss": 1.0905, "step": 28468 }, { "epoch": 0.86, "learning_rate": 2.610981533836665e-07, "loss": 1.104, "step": 28469 }, { "epoch": 0.86, "learning_rate": 2.609896344296819e-07, "loss": 1.1121, "step": 28470 }, { "epoch": 0.86, "learning_rate": 2.6088113678999797e-07, "loss": 1.0836, "step": 28471 }, { "epoch": 0.86, "learning_rate": 2.6077266046564714e-07, "loss": 1.088, "step": 28472 }, { "epoch": 0.86, "learning_rate": 2.606642054576619e-07, "loss": 1.1672, "step": 28473 }, { "epoch": 0.86, "learning_rate": 2.605557717670748e-07, "loss": 1.0335, "step": 28474 }, { "epoch": 0.86, "learning_rate": 2.6044735939491835e-07, "loss": 1.0758, "step": 28475 }, { "epoch": 0.86, "learning_rate": 2.603389683422244e-07, "loss": 1.0436, "step": 28476 }, { "epoch": 0.86, "learning_rate": 2.602305986100248e-07, "loss": 1.0144, "step": 28477 }, { "epoch": 0.86, "learning_rate": 2.601222501993514e-07, "loss": 1.0676, "step": 28478 }, { "epoch": 0.86, "learning_rate": 2.600139231112356e-07, "loss": 1.0577, "step": 28479 }, { "epoch": 0.86, "learning_rate": 2.599056173467082e-07, "loss": 1.1077, "step": 28480 }, { "epoch": 0.86, "learning_rate": 2.5979733290680043e-07, "loss": 1.0814, "step": 28481 }, { "epoch": 0.86, "learning_rate": 2.5968906979254303e-07, "loss": 1.0536, "step": 28482 }, { "epoch": 0.86, "learning_rate": 2.595808280049672e-07, "loss": 1.0604, "step": 28483 }, { "epoch": 0.86, "learning_rate": 2.5947260754510235e-07, "loss": 1.0695, "step": 28484 }, { "epoch": 0.86, "learning_rate": 2.593644084139793e-07, "loss": 0.9882, "step": 28485 }, { "epoch": 0.86, "learning_rate": 2.5925623061262784e-07, "loss": 1.1802, "step": 28486 }, { "epoch": 0.86, "learning_rate": 2.591480741420785e-07, "loss": 1.278, "step": 28487 }, { "epoch": 0.86, "learning_rate": 2.590399390033596e-07, "loss": 1.0438, "step": 28488 }, { "epoch": 0.86, "learning_rate": 2.589318251975012e-07, "loss": 1.115, "step": 28489 }, { "epoch": 0.86, "learning_rate": 2.5882373272553276e-07, "loss": 1.0858, "step": 28490 }, { "epoch": 0.86, "learning_rate": 2.587156615884828e-07, "loss": 1.1956, "step": 28491 }, { "epoch": 0.86, "learning_rate": 2.586076117873806e-07, "loss": 1.1202, "step": 28492 }, { "epoch": 0.86, "learning_rate": 2.5849958332325426e-07, "loss": 1.2181, "step": 28493 }, { "epoch": 0.86, "learning_rate": 2.583915761971323e-07, "loss": 1.0346, "step": 28494 }, { "epoch": 0.86, "learning_rate": 2.582835904100428e-07, "loss": 1.1202, "step": 28495 }, { "epoch": 0.86, "learning_rate": 2.5817562596301443e-07, "loss": 1.1014, "step": 28496 }, { "epoch": 0.86, "learning_rate": 2.5806768285707414e-07, "loss": 1.1692, "step": 28497 }, { "epoch": 0.86, "learning_rate": 2.579597610932494e-07, "loss": 1.0184, "step": 28498 }, { "epoch": 0.86, "learning_rate": 2.57851860672568e-07, "loss": 1.1912, "step": 28499 }, { "epoch": 0.86, "learning_rate": 2.577439815960572e-07, "loss": 1.1561, "step": 28500 }, { "epoch": 0.86, "learning_rate": 2.5763612386474376e-07, "loss": 1.0332, "step": 28501 }, { "epoch": 0.86, "learning_rate": 2.5752828747965447e-07, "loss": 0.9838, "step": 28502 }, { "epoch": 0.86, "learning_rate": 2.5742047244181583e-07, "loss": 1.1113, "step": 28503 }, { "epoch": 0.86, "learning_rate": 2.573126787522545e-07, "loss": 1.062, "step": 28504 }, { "epoch": 0.86, "learning_rate": 2.572049064119961e-07, "loss": 1.1009, "step": 28505 }, { "epoch": 0.86, "learning_rate": 2.5709715542206693e-07, "loss": 1.0659, "step": 28506 }, { "epoch": 0.86, "learning_rate": 2.5698942578349235e-07, "loss": 1.1647, "step": 28507 }, { "epoch": 0.86, "learning_rate": 2.5688171749729843e-07, "loss": 1.052, "step": 28508 }, { "epoch": 0.86, "learning_rate": 2.5677403056451056e-07, "loss": 1.0338, "step": 28509 }, { "epoch": 0.86, "learning_rate": 2.566663649861531e-07, "loss": 1.1433, "step": 28510 }, { "epoch": 0.86, "learning_rate": 2.565587207632514e-07, "loss": 1.0926, "step": 28511 }, { "epoch": 0.86, "learning_rate": 2.564510978968301e-07, "loss": 1.0155, "step": 28512 }, { "epoch": 0.86, "learning_rate": 2.563434963879144e-07, "loss": 1.1016, "step": 28513 }, { "epoch": 0.86, "learning_rate": 2.5623591623752745e-07, "loss": 1.2075, "step": 28514 }, { "epoch": 0.86, "learning_rate": 2.5612835744669413e-07, "loss": 1.1359, "step": 28515 }, { "epoch": 0.86, "learning_rate": 2.5602082001643794e-07, "loss": 1.054, "step": 28516 }, { "epoch": 0.86, "learning_rate": 2.559133039477835e-07, "loss": 1.1387, "step": 28517 }, { "epoch": 0.86, "learning_rate": 2.5580580924175316e-07, "loss": 0.9663, "step": 28518 }, { "epoch": 0.86, "learning_rate": 2.5569833589937057e-07, "loss": 1.0684, "step": 28519 }, { "epoch": 0.86, "learning_rate": 2.5559088392165893e-07, "loss": 1.0626, "step": 28520 }, { "epoch": 0.86, "learning_rate": 2.554834533096412e-07, "loss": 1.0615, "step": 28521 }, { "epoch": 0.86, "learning_rate": 2.5537604406434046e-07, "loss": 1.0689, "step": 28522 }, { "epoch": 0.86, "learning_rate": 2.5526865618677815e-07, "loss": 1.1833, "step": 28523 }, { "epoch": 0.86, "learning_rate": 2.5516128967797706e-07, "loss": 1.0211, "step": 28524 }, { "epoch": 0.86, "learning_rate": 2.5505394453895966e-07, "loss": 1.1827, "step": 28525 }, { "epoch": 0.86, "learning_rate": 2.549466207707471e-07, "loss": 1.019, "step": 28526 }, { "epoch": 0.86, "learning_rate": 2.5483931837436165e-07, "loss": 1.0116, "step": 28527 }, { "epoch": 0.86, "learning_rate": 2.5473203735082467e-07, "loss": 1.0117, "step": 28528 }, { "epoch": 0.86, "learning_rate": 2.5462477770115736e-07, "loss": 1.0578, "step": 28529 }, { "epoch": 0.86, "learning_rate": 2.5451753942638103e-07, "loss": 1.1712, "step": 28530 }, { "epoch": 0.86, "learning_rate": 2.5441032252751604e-07, "loss": 1.1838, "step": 28531 }, { "epoch": 0.86, "learning_rate": 2.543031270055829e-07, "loss": 1.091, "step": 28532 }, { "epoch": 0.86, "learning_rate": 2.5419595286160283e-07, "loss": 1.1573, "step": 28533 }, { "epoch": 0.86, "learning_rate": 2.540888000965955e-07, "loss": 1.1033, "step": 28534 }, { "epoch": 0.86, "learning_rate": 2.539816687115815e-07, "loss": 1.1048, "step": 28535 }, { "epoch": 0.86, "learning_rate": 2.5387455870758e-07, "loss": 1.3295, "step": 28536 }, { "epoch": 0.86, "learning_rate": 2.5376747008561074e-07, "loss": 1.0531, "step": 28537 }, { "epoch": 0.86, "learning_rate": 2.5366040284669354e-07, "loss": 1.1071, "step": 28538 }, { "epoch": 0.86, "learning_rate": 2.535533569918477e-07, "loss": 1.1477, "step": 28539 }, { "epoch": 0.86, "learning_rate": 2.5344633252209175e-07, "loss": 1.0949, "step": 28540 }, { "epoch": 0.86, "learning_rate": 2.5333932943844455e-07, "loss": 1.0258, "step": 28541 }, { "epoch": 0.86, "learning_rate": 2.532323477419249e-07, "loss": 0.964, "step": 28542 }, { "epoch": 0.86, "learning_rate": 2.531253874335518e-07, "loss": 1.2157, "step": 28543 }, { "epoch": 0.86, "learning_rate": 2.530184485143422e-07, "loss": 1.0018, "step": 28544 }, { "epoch": 0.86, "learning_rate": 2.52911530985315e-07, "loss": 1.1417, "step": 28545 }, { "epoch": 0.86, "learning_rate": 2.5280463484748777e-07, "loss": 1.1123, "step": 28546 }, { "epoch": 0.86, "learning_rate": 2.5269776010187817e-07, "loss": 1.0472, "step": 28547 }, { "epoch": 0.86, "learning_rate": 2.525909067495039e-07, "loss": 1.1805, "step": 28548 }, { "epoch": 0.86, "learning_rate": 2.524840747913815e-07, "loss": 0.979, "step": 28549 }, { "epoch": 0.86, "learning_rate": 2.5237726422852797e-07, "loss": 1.117, "step": 28550 }, { "epoch": 0.86, "learning_rate": 2.522704750619606e-07, "loss": 1.091, "step": 28551 }, { "epoch": 0.86, "learning_rate": 2.521637072926958e-07, "loss": 1.0989, "step": 28552 }, { "epoch": 0.86, "learning_rate": 2.520569609217502e-07, "loss": 1.0664, "step": 28553 }, { "epoch": 0.86, "learning_rate": 2.519502359501394e-07, "loss": 1.0099, "step": 28554 }, { "epoch": 0.86, "learning_rate": 2.5184353237887954e-07, "loss": 1.2057, "step": 28555 }, { "epoch": 0.86, "learning_rate": 2.5173685020898676e-07, "loss": 0.9684, "step": 28556 }, { "epoch": 0.86, "learning_rate": 2.5163018944147604e-07, "loss": 1.0322, "step": 28557 }, { "epoch": 0.86, "learning_rate": 2.515235500773633e-07, "loss": 1.0796, "step": 28558 }, { "epoch": 0.86, "learning_rate": 2.514169321176632e-07, "loss": 1.1089, "step": 28559 }, { "epoch": 0.86, "learning_rate": 2.5131033556339114e-07, "loss": 1.0939, "step": 28560 }, { "epoch": 0.86, "learning_rate": 2.5120376041556205e-07, "loss": 1.1055, "step": 28561 }, { "epoch": 0.86, "learning_rate": 2.510972066751896e-07, "loss": 1.0507, "step": 28562 }, { "epoch": 0.86, "learning_rate": 2.5099067434328886e-07, "loss": 0.9825, "step": 28563 }, { "epoch": 0.86, "learning_rate": 2.508841634208736e-07, "loss": 1.1777, "step": 28564 }, { "epoch": 0.86, "learning_rate": 2.507776739089582e-07, "loss": 1.1019, "step": 28565 }, { "epoch": 0.86, "learning_rate": 2.506712058085559e-07, "loss": 1.0215, "step": 28566 }, { "epoch": 0.86, "learning_rate": 2.5056475912068027e-07, "loss": 1.0848, "step": 28567 }, { "epoch": 0.86, "learning_rate": 2.504583338463448e-07, "loss": 1.1058, "step": 28568 }, { "epoch": 0.86, "learning_rate": 2.503519299865631e-07, "loss": 0.9233, "step": 28569 }, { "epoch": 0.86, "learning_rate": 2.5024554754234683e-07, "loss": 1.091, "step": 28570 }, { "epoch": 0.86, "learning_rate": 2.501391865147096e-07, "loss": 1.0139, "step": 28571 }, { "epoch": 0.86, "learning_rate": 2.5003284690466393e-07, "loss": 1.1045, "step": 28572 }, { "epoch": 0.86, "learning_rate": 2.499265287132216e-07, "loss": 1.075, "step": 28573 }, { "epoch": 0.86, "learning_rate": 2.498202319413959e-07, "loss": 1.0502, "step": 28574 }, { "epoch": 0.86, "learning_rate": 2.497139565901971e-07, "loss": 1.0085, "step": 28575 }, { "epoch": 0.86, "learning_rate": 2.496077026606378e-07, "loss": 1.1722, "step": 28576 }, { "epoch": 0.86, "learning_rate": 2.4950147015372906e-07, "loss": 0.9975, "step": 28577 }, { "epoch": 0.86, "learning_rate": 2.4939525907048315e-07, "loss": 1.0551, "step": 28578 }, { "epoch": 0.86, "learning_rate": 2.4928906941191015e-07, "loss": 1.0458, "step": 28579 }, { "epoch": 0.86, "learning_rate": 2.491829011790209e-07, "loss": 1.1236, "step": 28580 }, { "epoch": 0.86, "learning_rate": 2.4907675437282646e-07, "loss": 1.0339, "step": 28581 }, { "epoch": 0.86, "learning_rate": 2.4897062899433747e-07, "loss": 1.0744, "step": 28582 }, { "epoch": 0.86, "learning_rate": 2.488645250445637e-07, "loss": 1.0506, "step": 28583 }, { "epoch": 0.86, "learning_rate": 2.487584425245157e-07, "loss": 1.0345, "step": 28584 }, { "epoch": 0.86, "learning_rate": 2.4865238143520294e-07, "loss": 1.0058, "step": 28585 }, { "epoch": 0.86, "learning_rate": 2.4854634177763517e-07, "loss": 1.0626, "step": 28586 }, { "epoch": 0.86, "learning_rate": 2.484403235528224e-07, "loss": 1.0544, "step": 28587 }, { "epoch": 0.86, "learning_rate": 2.48334326761773e-07, "loss": 1.1374, "step": 28588 }, { "epoch": 0.86, "learning_rate": 2.4822835140549616e-07, "loss": 1.0593, "step": 28589 }, { "epoch": 0.86, "learning_rate": 2.481223974850011e-07, "loss": 1.1105, "step": 28590 }, { "epoch": 0.86, "learning_rate": 2.480164650012967e-07, "loss": 1.057, "step": 28591 }, { "epoch": 0.86, "learning_rate": 2.4791055395539053e-07, "loss": 1.0488, "step": 28592 }, { "epoch": 0.86, "learning_rate": 2.478046643482912e-07, "loss": 1.0478, "step": 28593 }, { "epoch": 0.86, "learning_rate": 2.4769879618100676e-07, "loss": 1.1288, "step": 28594 }, { "epoch": 0.86, "learning_rate": 2.4759294945454563e-07, "loss": 1.1408, "step": 28595 }, { "epoch": 0.86, "learning_rate": 2.474871241699142e-07, "loss": 1.0046, "step": 28596 }, { "epoch": 0.86, "learning_rate": 2.4738132032812056e-07, "loss": 1.1075, "step": 28597 }, { "epoch": 0.86, "learning_rate": 2.4727553793017197e-07, "loss": 1.061, "step": 28598 }, { "epoch": 0.86, "learning_rate": 2.4716977697707505e-07, "loss": 1.122, "step": 28599 }, { "epoch": 0.86, "learning_rate": 2.4706403746983745e-07, "loss": 1.0491, "step": 28600 }, { "epoch": 0.86, "learning_rate": 2.4695831940946465e-07, "loss": 1.0607, "step": 28601 }, { "epoch": 0.86, "learning_rate": 2.4685262279696366e-07, "loss": 1.1356, "step": 28602 }, { "epoch": 0.86, "learning_rate": 2.467469476333406e-07, "loss": 1.0312, "step": 28603 }, { "epoch": 0.86, "learning_rate": 2.4664129391960167e-07, "loss": 1.1051, "step": 28604 }, { "epoch": 0.86, "learning_rate": 2.4653566165675183e-07, "loss": 1.2046, "step": 28605 }, { "epoch": 0.86, "learning_rate": 2.464300508457976e-07, "loss": 1.156, "step": 28606 }, { "epoch": 0.86, "learning_rate": 2.463244614877436e-07, "loss": 1.0684, "step": 28607 }, { "epoch": 0.86, "learning_rate": 2.4621889358359516e-07, "loss": 1.1505, "step": 28608 }, { "epoch": 0.86, "learning_rate": 2.461133471343577e-07, "loss": 0.9995, "step": 28609 }, { "epoch": 0.86, "learning_rate": 2.460078221410356e-07, "loss": 1.1373, "step": 28610 }, { "epoch": 0.86, "learning_rate": 2.459023186046336e-07, "loss": 1.0787, "step": 28611 }, { "epoch": 0.86, "learning_rate": 2.4579683652615564e-07, "loss": 1.1348, "step": 28612 }, { "epoch": 0.86, "learning_rate": 2.456913759066068e-07, "loss": 1.023, "step": 28613 }, { "epoch": 0.86, "learning_rate": 2.455859367469898e-07, "loss": 1.1224, "step": 28614 }, { "epoch": 0.86, "learning_rate": 2.4548051904830896e-07, "loss": 1.0893, "step": 28615 }, { "epoch": 0.86, "learning_rate": 2.4537512281156776e-07, "loss": 1.0522, "step": 28616 }, { "epoch": 0.86, "learning_rate": 2.4526974803777e-07, "loss": 1.1014, "step": 28617 }, { "epoch": 0.86, "learning_rate": 2.451643947279178e-07, "loss": 1.0997, "step": 28618 }, { "epoch": 0.86, "learning_rate": 2.450590628830146e-07, "loss": 1.013, "step": 28619 }, { "epoch": 0.86, "learning_rate": 2.4495375250406294e-07, "loss": 1.0603, "step": 28620 }, { "epoch": 0.86, "learning_rate": 2.4484846359206614e-07, "loss": 1.057, "step": 28621 }, { "epoch": 0.86, "learning_rate": 2.4474319614802537e-07, "loss": 0.9769, "step": 28622 }, { "epoch": 0.86, "learning_rate": 2.4463795017294346e-07, "loss": 1.0634, "step": 28623 }, { "epoch": 0.86, "learning_rate": 2.4453272566782176e-07, "loss": 1.1089, "step": 28624 }, { "epoch": 0.86, "learning_rate": 2.444275226336623e-07, "loss": 1.139, "step": 28625 }, { "epoch": 0.86, "learning_rate": 2.443223410714668e-07, "loss": 1.127, "step": 28626 }, { "epoch": 0.86, "learning_rate": 2.4421718098223607e-07, "loss": 1.1263, "step": 28627 }, { "epoch": 0.86, "learning_rate": 2.441120423669713e-07, "loss": 1.054, "step": 28628 }, { "epoch": 0.86, "learning_rate": 2.440069252266733e-07, "loss": 1.0658, "step": 28629 }, { "epoch": 0.86, "learning_rate": 2.4390182956234324e-07, "loss": 1.2197, "step": 28630 }, { "epoch": 0.86, "learning_rate": 2.4379675537498094e-07, "loss": 1.1722, "step": 28631 }, { "epoch": 0.86, "learning_rate": 2.436917026655866e-07, "loss": 1.0649, "step": 28632 }, { "epoch": 0.86, "learning_rate": 2.435866714351609e-07, "loss": 1.1273, "step": 28633 }, { "epoch": 0.86, "learning_rate": 2.4348166168470326e-07, "loss": 1.0483, "step": 28634 }, { "epoch": 0.86, "learning_rate": 2.433766734152132e-07, "loss": 1.0692, "step": 28635 }, { "epoch": 0.86, "learning_rate": 2.43271706627691e-07, "loss": 1.1028, "step": 28636 }, { "epoch": 0.86, "learning_rate": 2.4316676132313505e-07, "loss": 1.2136, "step": 28637 }, { "epoch": 0.86, "learning_rate": 2.430618375025442e-07, "loss": 1.1417, "step": 28638 }, { "epoch": 0.86, "learning_rate": 2.429569351669181e-07, "loss": 1.0448, "step": 28639 }, { "epoch": 0.86, "learning_rate": 2.428520543172547e-07, "loss": 1.0513, "step": 28640 }, { "epoch": 0.86, "learning_rate": 2.427471949545526e-07, "loss": 1.0771, "step": 28641 }, { "epoch": 0.86, "learning_rate": 2.4264235707981e-07, "loss": 1.1122, "step": 28642 }, { "epoch": 0.86, "learning_rate": 2.4253754069402584e-07, "loss": 1.0972, "step": 28643 }, { "epoch": 0.86, "learning_rate": 2.424327457981962e-07, "loss": 0.9922, "step": 28644 }, { "epoch": 0.86, "learning_rate": 2.423279723933197e-07, "loss": 1.111, "step": 28645 }, { "epoch": 0.86, "learning_rate": 2.422232204803937e-07, "loss": 1.0967, "step": 28646 }, { "epoch": 0.86, "learning_rate": 2.4211849006041566e-07, "loss": 1.1968, "step": 28647 }, { "epoch": 0.86, "learning_rate": 2.4201378113438144e-07, "loss": 1.0682, "step": 28648 }, { "epoch": 0.86, "learning_rate": 2.4190909370328893e-07, "loss": 1.1348, "step": 28649 }, { "epoch": 0.86, "learning_rate": 2.418044277681342e-07, "loss": 1.1682, "step": 28650 }, { "epoch": 0.86, "learning_rate": 2.416997833299134e-07, "loss": 1.087, "step": 28651 }, { "epoch": 0.86, "learning_rate": 2.4159516038962384e-07, "loss": 1.1534, "step": 28652 }, { "epoch": 0.86, "learning_rate": 2.4149055894826025e-07, "loss": 1.0519, "step": 28653 }, { "epoch": 0.86, "learning_rate": 2.413859790068185e-07, "loss": 1.1406, "step": 28654 }, { "epoch": 0.86, "learning_rate": 2.4128142056629475e-07, "loss": 1.1468, "step": 28655 }, { "epoch": 0.86, "learning_rate": 2.4117688362768425e-07, "loss": 1.1378, "step": 28656 }, { "epoch": 0.86, "learning_rate": 2.410723681919816e-07, "loss": 1.1376, "step": 28657 }, { "epoch": 0.86, "learning_rate": 2.4096787426018204e-07, "loss": 1.1607, "step": 28658 }, { "epoch": 0.86, "learning_rate": 2.408634018332803e-07, "loss": 1.0245, "step": 28659 }, { "epoch": 0.86, "learning_rate": 2.4075895091227153e-07, "loss": 1.1516, "step": 28660 }, { "epoch": 0.86, "learning_rate": 2.406545214981487e-07, "loss": 1.2324, "step": 28661 }, { "epoch": 0.86, "learning_rate": 2.4055011359190695e-07, "loss": 0.9018, "step": 28662 }, { "epoch": 0.86, "learning_rate": 2.4044572719453983e-07, "loss": 1.1736, "step": 28663 }, { "epoch": 0.86, "learning_rate": 2.4034136230704135e-07, "loss": 1.0226, "step": 28664 }, { "epoch": 0.86, "learning_rate": 2.4023701893040457e-07, "loss": 1.0149, "step": 28665 }, { "epoch": 0.86, "learning_rate": 2.4013269706562315e-07, "loss": 1.1005, "step": 28666 }, { "epoch": 0.86, "learning_rate": 2.4002839671368986e-07, "loss": 0.9942, "step": 28667 }, { "epoch": 0.86, "learning_rate": 2.399241178755982e-07, "loss": 1.1489, "step": 28668 }, { "epoch": 0.86, "learning_rate": 2.398198605523405e-07, "loss": 0.9997, "step": 28669 }, { "epoch": 0.86, "learning_rate": 2.397156247449089e-07, "loss": 1.2307, "step": 28670 }, { "epoch": 0.86, "learning_rate": 2.39611410454296e-07, "loss": 1.0488, "step": 28671 }, { "epoch": 0.86, "learning_rate": 2.395072176814939e-07, "loss": 1.1363, "step": 28672 }, { "epoch": 0.86, "learning_rate": 2.3940304642749464e-07, "loss": 1.1512, "step": 28673 }, { "epoch": 0.86, "learning_rate": 2.3929889669328937e-07, "loss": 1.1837, "step": 28674 }, { "epoch": 0.86, "learning_rate": 2.3919476847986957e-07, "loss": 1.0544, "step": 28675 }, { "epoch": 0.86, "learning_rate": 2.3909066178822686e-07, "loss": 1.0135, "step": 28676 }, { "epoch": 0.86, "learning_rate": 2.389865766193522e-07, "loss": 1.031, "step": 28677 }, { "epoch": 0.86, "learning_rate": 2.38882512974237e-07, "loss": 1.1035, "step": 28678 }, { "epoch": 0.86, "learning_rate": 2.387784708538707e-07, "loss": 0.9827, "step": 28679 }, { "epoch": 0.86, "learning_rate": 2.386744502592442e-07, "loss": 1.165, "step": 28680 }, { "epoch": 0.86, "learning_rate": 2.385704511913478e-07, "loss": 0.8938, "step": 28681 }, { "epoch": 0.86, "learning_rate": 2.3846647365117215e-07, "loss": 1.0792, "step": 28682 }, { "epoch": 0.86, "learning_rate": 2.3836251763970615e-07, "loss": 1.0455, "step": 28683 }, { "epoch": 0.86, "learning_rate": 2.3825858315793955e-07, "loss": 1.0938, "step": 28684 }, { "epoch": 0.86, "learning_rate": 2.3815467020686212e-07, "loss": 1.0325, "step": 28685 }, { "epoch": 0.86, "learning_rate": 2.3805077878746309e-07, "loss": 1.21, "step": 28686 }, { "epoch": 0.86, "learning_rate": 2.379469089007308e-07, "loss": 1.072, "step": 28687 }, { "epoch": 0.86, "learning_rate": 2.3784306054765476e-07, "loss": 1.2501, "step": 28688 }, { "epoch": 0.86, "learning_rate": 2.3773923372922309e-07, "loss": 1.1495, "step": 28689 }, { "epoch": 0.86, "learning_rate": 2.376354284464244e-07, "loss": 1.1067, "step": 28690 }, { "epoch": 0.86, "learning_rate": 2.3753164470024708e-07, "loss": 1.0325, "step": 28691 }, { "epoch": 0.86, "learning_rate": 2.3742788249167843e-07, "loss": 1.1736, "step": 28692 }, { "epoch": 0.86, "learning_rate": 2.3732414182170706e-07, "loss": 1.1755, "step": 28693 }, { "epoch": 0.86, "learning_rate": 2.3722042269131994e-07, "loss": 1.1508, "step": 28694 }, { "epoch": 0.86, "learning_rate": 2.3711672510150496e-07, "loss": 1.128, "step": 28695 }, { "epoch": 0.86, "learning_rate": 2.370130490532485e-07, "loss": 1.0274, "step": 28696 }, { "epoch": 0.86, "learning_rate": 2.3690939454753813e-07, "loss": 1.0201, "step": 28697 }, { "epoch": 0.86, "learning_rate": 2.3680576158536e-07, "loss": 1.1204, "step": 28698 }, { "epoch": 0.86, "learning_rate": 2.3670215016770192e-07, "loss": 1.2427, "step": 28699 }, { "epoch": 0.86, "learning_rate": 2.3659856029554867e-07, "loss": 1.2328, "step": 28700 }, { "epoch": 0.86, "learning_rate": 2.3649499196988694e-07, "loss": 1.0697, "step": 28701 }, { "epoch": 0.86, "learning_rate": 2.3639144519170292e-07, "loss": 1.0978, "step": 28702 }, { "epoch": 0.86, "learning_rate": 2.3628791996198247e-07, "loss": 1.1263, "step": 28703 }, { "epoch": 0.86, "learning_rate": 2.3618441628171034e-07, "loss": 1.0778, "step": 28704 }, { "epoch": 0.86, "learning_rate": 2.3608093415187217e-07, "loss": 1.0507, "step": 28705 }, { "epoch": 0.86, "learning_rate": 2.3597747357345353e-07, "loss": 1.1655, "step": 28706 }, { "epoch": 0.86, "learning_rate": 2.3587403454743861e-07, "loss": 1.1115, "step": 28707 }, { "epoch": 0.86, "learning_rate": 2.357706170748131e-07, "loss": 1.0076, "step": 28708 }, { "epoch": 0.86, "learning_rate": 2.3566722115656027e-07, "loss": 1.0914, "step": 28709 }, { "epoch": 0.86, "learning_rate": 2.3556384679366495e-07, "loss": 1.0997, "step": 28710 }, { "epoch": 0.86, "learning_rate": 2.3546049398711108e-07, "loss": 1.139, "step": 28711 }, { "epoch": 0.86, "learning_rate": 2.353571627378834e-07, "loss": 1.0941, "step": 28712 }, { "epoch": 0.86, "learning_rate": 2.3525385304696418e-07, "loss": 1.103, "step": 28713 }, { "epoch": 0.87, "learning_rate": 2.3515056491533768e-07, "loss": 1.1054, "step": 28714 }, { "epoch": 0.87, "learning_rate": 2.3504729834398693e-07, "loss": 1.1288, "step": 28715 }, { "epoch": 0.87, "learning_rate": 2.349440533338951e-07, "loss": 1.0039, "step": 28716 }, { "epoch": 0.87, "learning_rate": 2.3484082988604495e-07, "loss": 1.1566, "step": 28717 }, { "epoch": 0.87, "learning_rate": 2.3473762800141965e-07, "loss": 1.1799, "step": 28718 }, { "epoch": 0.87, "learning_rate": 2.3463444768100085e-07, "loss": 1.044, "step": 28719 }, { "epoch": 0.87, "learning_rate": 2.3453128892577086e-07, "loss": 1.1727, "step": 28720 }, { "epoch": 0.87, "learning_rate": 2.3442815173671197e-07, "loss": 1.0972, "step": 28721 }, { "epoch": 0.87, "learning_rate": 2.3432503611480584e-07, "loss": 1.0868, "step": 28722 }, { "epoch": 0.87, "learning_rate": 2.3422194206103422e-07, "loss": 1.0943, "step": 28723 }, { "epoch": 0.87, "learning_rate": 2.3411886957637853e-07, "loss": 1.2056, "step": 28724 }, { "epoch": 0.87, "learning_rate": 2.3401581866182048e-07, "loss": 1.2151, "step": 28725 }, { "epoch": 0.87, "learning_rate": 2.3391278931833988e-07, "loss": 1.0422, "step": 28726 }, { "epoch": 0.87, "learning_rate": 2.3380978154691814e-07, "loss": 1.11, "step": 28727 }, { "epoch": 0.87, "learning_rate": 2.3370679534853586e-07, "loss": 1.1339, "step": 28728 }, { "epoch": 0.87, "learning_rate": 2.336038307241739e-07, "loss": 1.1478, "step": 28729 }, { "epoch": 0.87, "learning_rate": 2.3350088767481154e-07, "loss": 1.0176, "step": 28730 }, { "epoch": 0.87, "learning_rate": 2.3339796620142906e-07, "loss": 1.1757, "step": 28731 }, { "epoch": 0.87, "learning_rate": 2.3329506630500627e-07, "loss": 1.0411, "step": 28732 }, { "epoch": 0.87, "learning_rate": 2.3319218798652287e-07, "loss": 1.0944, "step": 28733 }, { "epoch": 0.87, "learning_rate": 2.3308933124695842e-07, "loss": 1.1204, "step": 28734 }, { "epoch": 0.87, "learning_rate": 2.3298649608729158e-07, "loss": 1.1174, "step": 28735 }, { "epoch": 0.87, "learning_rate": 2.3288368250850124e-07, "loss": 1.1061, "step": 28736 }, { "epoch": 0.87, "learning_rate": 2.327808905115664e-07, "loss": 1.0472, "step": 28737 }, { "epoch": 0.87, "learning_rate": 2.3267812009746594e-07, "loss": 1.1151, "step": 28738 }, { "epoch": 0.87, "learning_rate": 2.3257537126717743e-07, "loss": 1.0582, "step": 28739 }, { "epoch": 0.87, "learning_rate": 2.324726440216793e-07, "loss": 1.1157, "step": 28740 }, { "epoch": 0.87, "learning_rate": 2.323699383619496e-07, "loss": 1.014, "step": 28741 }, { "epoch": 0.87, "learning_rate": 2.3226725428896645e-07, "loss": 1.1913, "step": 28742 }, { "epoch": 0.87, "learning_rate": 2.3216459180370633e-07, "loss": 1.1033, "step": 28743 }, { "epoch": 0.87, "learning_rate": 2.3206195090714702e-07, "loss": 1.2079, "step": 28744 }, { "epoch": 0.87, "learning_rate": 2.3195933160026578e-07, "loss": 1.1149, "step": 28745 }, { "epoch": 0.87, "learning_rate": 2.318567338840394e-07, "loss": 1.0829, "step": 28746 }, { "epoch": 0.87, "learning_rate": 2.3175415775944427e-07, "loss": 1.0875, "step": 28747 }, { "epoch": 0.87, "learning_rate": 2.316516032274574e-07, "loss": 1.0837, "step": 28748 }, { "epoch": 0.87, "learning_rate": 2.3154907028905465e-07, "loss": 1.0175, "step": 28749 }, { "epoch": 0.87, "learning_rate": 2.3144655894521222e-07, "loss": 1.0196, "step": 28750 }, { "epoch": 0.87, "learning_rate": 2.3134406919690654e-07, "loss": 1.0645, "step": 28751 }, { "epoch": 0.87, "learning_rate": 2.312416010451121e-07, "loss": 1.0547, "step": 28752 }, { "epoch": 0.87, "learning_rate": 2.311391544908051e-07, "loss": 1.2371, "step": 28753 }, { "epoch": 0.87, "learning_rate": 2.3103672953496055e-07, "loss": 1.1009, "step": 28754 }, { "epoch": 0.87, "learning_rate": 2.3093432617855406e-07, "loss": 1.1005, "step": 28755 }, { "epoch": 0.87, "learning_rate": 2.3083194442255959e-07, "loss": 1.1577, "step": 28756 }, { "epoch": 0.87, "learning_rate": 2.3072958426795218e-07, "loss": 1.1068, "step": 28757 }, { "epoch": 0.87, "learning_rate": 2.3062724571570605e-07, "loss": 1.0352, "step": 28758 }, { "epoch": 0.87, "learning_rate": 2.3052492876679543e-07, "loss": 1.1046, "step": 28759 }, { "epoch": 0.87, "learning_rate": 2.3042263342219512e-07, "loss": 1.0408, "step": 28760 }, { "epoch": 0.87, "learning_rate": 2.303203596828779e-07, "loss": 1.1553, "step": 28761 }, { "epoch": 0.87, "learning_rate": 2.302181075498175e-07, "loss": 1.1403, "step": 28762 }, { "epoch": 0.87, "learning_rate": 2.301158770239878e-07, "loss": 1.078, "step": 28763 }, { "epoch": 0.87, "learning_rate": 2.3001366810636195e-07, "loss": 1.1274, "step": 28764 }, { "epoch": 0.87, "learning_rate": 2.2991148079791247e-07, "loss": 1.1761, "step": 28765 }, { "epoch": 0.87, "learning_rate": 2.2980931509961223e-07, "loss": 1.015, "step": 28766 }, { "epoch": 0.87, "learning_rate": 2.2970717101243406e-07, "loss": 1.165, "step": 28767 }, { "epoch": 0.87, "learning_rate": 2.2960504853735078e-07, "loss": 1.1089, "step": 28768 }, { "epoch": 0.87, "learning_rate": 2.2950294767533326e-07, "loss": 1.0364, "step": 28769 }, { "epoch": 0.87, "learning_rate": 2.2940086842735438e-07, "loss": 1.0343, "step": 28770 }, { "epoch": 0.87, "learning_rate": 2.2929881079438553e-07, "loss": 1.0357, "step": 28771 }, { "epoch": 0.87, "learning_rate": 2.2919677477739822e-07, "loss": 1.067, "step": 28772 }, { "epoch": 0.87, "learning_rate": 2.2909476037736438e-07, "loss": 1.2322, "step": 28773 }, { "epoch": 0.87, "learning_rate": 2.289927675952544e-07, "loss": 1.051, "step": 28774 }, { "epoch": 0.87, "learning_rate": 2.288907964320397e-07, "loss": 1.0658, "step": 28775 }, { "epoch": 0.87, "learning_rate": 2.2878884688869063e-07, "loss": 1.1498, "step": 28776 }, { "epoch": 0.87, "learning_rate": 2.2868691896617862e-07, "loss": 1.0165, "step": 28777 }, { "epoch": 0.87, "learning_rate": 2.2858501266547262e-07, "loss": 1.0657, "step": 28778 }, { "epoch": 0.87, "learning_rate": 2.2848312798754325e-07, "loss": 1.205, "step": 28779 }, { "epoch": 0.87, "learning_rate": 2.2838126493336055e-07, "loss": 1.142, "step": 28780 }, { "epoch": 0.87, "learning_rate": 2.2827942350389458e-07, "loss": 1.1921, "step": 28781 }, { "epoch": 0.87, "learning_rate": 2.2817760370011406e-07, "loss": 1.1316, "step": 28782 }, { "epoch": 0.87, "learning_rate": 2.2807580552298868e-07, "loss": 1.1602, "step": 28783 }, { "epoch": 0.87, "learning_rate": 2.279740289734872e-07, "loss": 1.0093, "step": 28784 }, { "epoch": 0.87, "learning_rate": 2.2787227405257878e-07, "loss": 1.1603, "step": 28785 }, { "epoch": 0.87, "learning_rate": 2.2777054076123267e-07, "loss": 1.2377, "step": 28786 }, { "epoch": 0.87, "learning_rate": 2.2766882910041617e-07, "loss": 1.1415, "step": 28787 }, { "epoch": 0.87, "learning_rate": 2.275671390710979e-07, "loss": 1.202, "step": 28788 }, { "epoch": 0.87, "learning_rate": 2.2746547067424602e-07, "loss": 1.0201, "step": 28789 }, { "epoch": 0.87, "learning_rate": 2.273638239108289e-07, "loss": 0.9269, "step": 28790 }, { "epoch": 0.87, "learning_rate": 2.27262198781813e-07, "loss": 1.0402, "step": 28791 }, { "epoch": 0.87, "learning_rate": 2.271605952881667e-07, "loss": 1.1219, "step": 28792 }, { "epoch": 0.87, "learning_rate": 2.2705901343085674e-07, "loss": 1.2167, "step": 28793 }, { "epoch": 0.87, "learning_rate": 2.2695745321085066e-07, "loss": 1.2034, "step": 28794 }, { "epoch": 0.87, "learning_rate": 2.2685591462911438e-07, "loss": 0.9753, "step": 28795 }, { "epoch": 0.87, "learning_rate": 2.2675439768661518e-07, "loss": 1.1408, "step": 28796 }, { "epoch": 0.87, "learning_rate": 2.266529023843192e-07, "loss": 1.2253, "step": 28797 }, { "epoch": 0.87, "learning_rate": 2.265514287231929e-07, "loss": 1.121, "step": 28798 }, { "epoch": 0.87, "learning_rate": 2.2644997670420166e-07, "loss": 1.1177, "step": 28799 }, { "epoch": 0.87, "learning_rate": 2.2634854632831244e-07, "loss": 1.0355, "step": 28800 }, { "epoch": 0.87, "learning_rate": 2.2624713759648946e-07, "loss": 1.0837, "step": 28801 }, { "epoch": 0.87, "learning_rate": 2.2614575050969867e-07, "loss": 1.1416, "step": 28802 }, { "epoch": 0.87, "learning_rate": 2.2604438506890537e-07, "loss": 1.1082, "step": 28803 }, { "epoch": 0.87, "learning_rate": 2.2594304127507405e-07, "loss": 1.2045, "step": 28804 }, { "epoch": 0.87, "learning_rate": 2.2584171912917007e-07, "loss": 1.2551, "step": 28805 }, { "epoch": 0.87, "learning_rate": 2.257404186321574e-07, "loss": 1.0815, "step": 28806 }, { "epoch": 0.87, "learning_rate": 2.2563913978500134e-07, "loss": 1.05, "step": 28807 }, { "epoch": 0.87, "learning_rate": 2.2553788258866449e-07, "loss": 1.0508, "step": 28808 }, { "epoch": 0.87, "learning_rate": 2.2543664704411189e-07, "loss": 1.0503, "step": 28809 }, { "epoch": 0.87, "learning_rate": 2.2533543315230667e-07, "loss": 1.1309, "step": 28810 }, { "epoch": 0.87, "learning_rate": 2.2523424091421276e-07, "loss": 1.2467, "step": 28811 }, { "epoch": 0.87, "learning_rate": 2.2513307033079384e-07, "loss": 1.146, "step": 28812 }, { "epoch": 0.87, "learning_rate": 2.2503192140301195e-07, "loss": 1.0705, "step": 28813 }, { "epoch": 0.87, "learning_rate": 2.2493079413183045e-07, "loss": 1.0713, "step": 28814 }, { "epoch": 0.87, "learning_rate": 2.2482968851821218e-07, "loss": 1.1244, "step": 28815 }, { "epoch": 0.87, "learning_rate": 2.2472860456312002e-07, "loss": 1.0917, "step": 28816 }, { "epoch": 0.87, "learning_rate": 2.246275422675151e-07, "loss": 1.2612, "step": 28817 }, { "epoch": 0.87, "learning_rate": 2.2452650163236028e-07, "loss": 1.1668, "step": 28818 }, { "epoch": 0.87, "learning_rate": 2.2442548265861703e-07, "loss": 1.0222, "step": 28819 }, { "epoch": 0.87, "learning_rate": 2.2432448534724788e-07, "loss": 1.0445, "step": 28820 }, { "epoch": 0.87, "learning_rate": 2.2422350969921318e-07, "loss": 1.1361, "step": 28821 }, { "epoch": 0.87, "learning_rate": 2.241225557154747e-07, "loss": 1.1389, "step": 28822 }, { "epoch": 0.87, "learning_rate": 2.2402162339699301e-07, "loss": 1.1438, "step": 28823 }, { "epoch": 0.87, "learning_rate": 2.239207127447296e-07, "loss": 1.3439, "step": 28824 }, { "epoch": 0.87, "learning_rate": 2.2381982375964535e-07, "loss": 1.084, "step": 28825 }, { "epoch": 0.87, "learning_rate": 2.2371895644269949e-07, "loss": 1.122, "step": 28826 }, { "epoch": 0.87, "learning_rate": 2.236181107948529e-07, "loss": 1.0462, "step": 28827 }, { "epoch": 0.87, "learning_rate": 2.235172868170657e-07, "loss": 1.0754, "step": 28828 }, { "epoch": 0.87, "learning_rate": 2.2341648451029736e-07, "loss": 1.0934, "step": 28829 }, { "epoch": 0.87, "learning_rate": 2.2331570387550767e-07, "loss": 1.1927, "step": 28830 }, { "epoch": 0.87, "learning_rate": 2.2321494491365615e-07, "loss": 1.1276, "step": 28831 }, { "epoch": 0.87, "learning_rate": 2.2311420762570173e-07, "loss": 1.1649, "step": 28832 }, { "epoch": 0.87, "learning_rate": 2.230134920126037e-07, "loss": 1.1422, "step": 28833 }, { "epoch": 0.87, "learning_rate": 2.229127980753204e-07, "loss": 1.0231, "step": 28834 }, { "epoch": 0.87, "learning_rate": 2.2281212581481054e-07, "loss": 1.027, "step": 28835 }, { "epoch": 0.87, "learning_rate": 2.2271147523203252e-07, "loss": 1.1135, "step": 28836 }, { "epoch": 0.87, "learning_rate": 2.2261084632794445e-07, "loss": 1.1494, "step": 28837 }, { "epoch": 0.87, "learning_rate": 2.2251023910350472e-07, "loss": 0.9831, "step": 28838 }, { "epoch": 0.87, "learning_rate": 2.224096535596701e-07, "loss": 1.1188, "step": 28839 }, { "epoch": 0.87, "learning_rate": 2.2230908969739866e-07, "loss": 1.1501, "step": 28840 }, { "epoch": 0.87, "learning_rate": 2.2220854751764804e-07, "loss": 1.1275, "step": 28841 }, { "epoch": 0.87, "learning_rate": 2.2210802702137518e-07, "loss": 1.093, "step": 28842 }, { "epoch": 0.87, "learning_rate": 2.220075282095363e-07, "loss": 1.1389, "step": 28843 }, { "epoch": 0.87, "learning_rate": 2.2190705108308896e-07, "loss": 1.179, "step": 28844 }, { "epoch": 0.87, "learning_rate": 2.2180659564298907e-07, "loss": 1.0952, "step": 28845 }, { "epoch": 0.87, "learning_rate": 2.217061618901936e-07, "loss": 1.2311, "step": 28846 }, { "epoch": 0.87, "learning_rate": 2.2160574982565796e-07, "loss": 1.1136, "step": 28847 }, { "epoch": 0.87, "learning_rate": 2.21505359450338e-07, "loss": 1.1458, "step": 28848 }, { "epoch": 0.87, "learning_rate": 2.2140499076518996e-07, "loss": 1.1029, "step": 28849 }, { "epoch": 0.87, "learning_rate": 2.2130464377116885e-07, "loss": 1.0493, "step": 28850 }, { "epoch": 0.87, "learning_rate": 2.2120431846923057e-07, "loss": 1.0488, "step": 28851 }, { "epoch": 0.87, "learning_rate": 2.2110401486032913e-07, "loss": 1.0942, "step": 28852 }, { "epoch": 0.87, "learning_rate": 2.210037329454198e-07, "loss": 1.073, "step": 28853 }, { "epoch": 0.87, "learning_rate": 2.2090347272545775e-07, "loss": 1.1541, "step": 28854 }, { "epoch": 0.87, "learning_rate": 2.208032342013966e-07, "loss": 1.0676, "step": 28855 }, { "epoch": 0.87, "learning_rate": 2.2070301737419115e-07, "loss": 1.303, "step": 28856 }, { "epoch": 0.87, "learning_rate": 2.2060282224479506e-07, "loss": 1.1943, "step": 28857 }, { "epoch": 0.87, "learning_rate": 2.205026488141626e-07, "loss": 1.174, "step": 28858 }, { "epoch": 0.87, "learning_rate": 2.2040249708324719e-07, "loss": 1.109, "step": 28859 }, { "epoch": 0.87, "learning_rate": 2.2030236705300189e-07, "loss": 1.1216, "step": 28860 }, { "epoch": 0.87, "learning_rate": 2.202022587243799e-07, "loss": 1.147, "step": 28861 }, { "epoch": 0.87, "learning_rate": 2.2010217209833455e-07, "loss": 1.097, "step": 28862 }, { "epoch": 0.87, "learning_rate": 2.2000210717581877e-07, "loss": 1.0742, "step": 28863 }, { "epoch": 0.87, "learning_rate": 2.199020639577848e-07, "loss": 1.0415, "step": 28864 }, { "epoch": 0.87, "learning_rate": 2.1980204244518494e-07, "loss": 1.1052, "step": 28865 }, { "epoch": 0.87, "learning_rate": 2.1970204263897123e-07, "loss": 1.0735, "step": 28866 }, { "epoch": 0.87, "learning_rate": 2.196020645400962e-07, "loss": 1.1436, "step": 28867 }, { "epoch": 0.87, "learning_rate": 2.1950210814951134e-07, "loss": 1.0672, "step": 28868 }, { "epoch": 0.87, "learning_rate": 2.1940217346816783e-07, "loss": 1.0139, "step": 28869 }, { "epoch": 0.87, "learning_rate": 2.1930226049701713e-07, "loss": 1.1146, "step": 28870 }, { "epoch": 0.87, "learning_rate": 2.1920236923701043e-07, "loss": 1.0544, "step": 28871 }, { "epoch": 0.87, "learning_rate": 2.191024996890992e-07, "loss": 0.9909, "step": 28872 }, { "epoch": 0.87, "learning_rate": 2.190026518542332e-07, "loss": 1.0173, "step": 28873 }, { "epoch": 0.87, "learning_rate": 2.1890282573336363e-07, "loss": 1.1871, "step": 28874 }, { "epoch": 0.87, "learning_rate": 2.188030213274403e-07, "loss": 1.0359, "step": 28875 }, { "epoch": 0.87, "learning_rate": 2.1870323863741412e-07, "loss": 1.1055, "step": 28876 }, { "epoch": 0.87, "learning_rate": 2.1860347766423373e-07, "loss": 1.0577, "step": 28877 }, { "epoch": 0.87, "learning_rate": 2.1850373840884982e-07, "loss": 1.1497, "step": 28878 }, { "epoch": 0.87, "learning_rate": 2.184040208722113e-07, "loss": 1.164, "step": 28879 }, { "epoch": 0.87, "learning_rate": 2.1830432505526745e-07, "loss": 1.0616, "step": 28880 }, { "epoch": 0.87, "learning_rate": 2.1820465095896776e-07, "loss": 1.1013, "step": 28881 }, { "epoch": 0.87, "learning_rate": 2.1810499858426093e-07, "loss": 1.0769, "step": 28882 }, { "epoch": 0.87, "learning_rate": 2.1800536793209592e-07, "loss": 1.0161, "step": 28883 }, { "epoch": 0.87, "learning_rate": 2.1790575900342005e-07, "loss": 1.1913, "step": 28884 }, { "epoch": 0.87, "learning_rate": 2.1780617179918252e-07, "loss": 1.0048, "step": 28885 }, { "epoch": 0.87, "learning_rate": 2.177066063203312e-07, "loss": 1.1532, "step": 28886 }, { "epoch": 0.87, "learning_rate": 2.176070625678134e-07, "loss": 1.0762, "step": 28887 }, { "epoch": 0.87, "learning_rate": 2.175075405425775e-07, "loss": 1.0271, "step": 28888 }, { "epoch": 0.87, "learning_rate": 2.1740804024557084e-07, "loss": 1.017, "step": 28889 }, { "epoch": 0.87, "learning_rate": 2.1730856167773983e-07, "loss": 1.0391, "step": 28890 }, { "epoch": 0.87, "learning_rate": 2.1720910484003183e-07, "loss": 1.0609, "step": 28891 }, { "epoch": 0.87, "learning_rate": 2.1710966973339382e-07, "loss": 1.0768, "step": 28892 }, { "epoch": 0.87, "learning_rate": 2.1701025635877228e-07, "loss": 1.0623, "step": 28893 }, { "epoch": 0.87, "learning_rate": 2.169108647171142e-07, "loss": 1.1201, "step": 28894 }, { "epoch": 0.87, "learning_rate": 2.1681149480936443e-07, "loss": 0.9984, "step": 28895 }, { "epoch": 0.87, "learning_rate": 2.1671214663646968e-07, "loss": 1.1693, "step": 28896 }, { "epoch": 0.87, "learning_rate": 2.1661282019937559e-07, "loss": 1.0993, "step": 28897 }, { "epoch": 0.87, "learning_rate": 2.1651351549902834e-07, "loss": 1.0643, "step": 28898 }, { "epoch": 0.87, "learning_rate": 2.164142325363719e-07, "loss": 1.2066, "step": 28899 }, { "epoch": 0.87, "learning_rate": 2.1631497131235247e-07, "loss": 1.1639, "step": 28900 }, { "epoch": 0.87, "learning_rate": 2.1621573182791455e-07, "loss": 1.0085, "step": 28901 }, { "epoch": 0.87, "learning_rate": 2.1611651408400326e-07, "loss": 0.9636, "step": 28902 }, { "epoch": 0.87, "learning_rate": 2.160173180815625e-07, "loss": 1.0623, "step": 28903 }, { "epoch": 0.87, "learning_rate": 2.1591814382153686e-07, "loss": 1.043, "step": 28904 }, { "epoch": 0.87, "learning_rate": 2.1581899130487056e-07, "loss": 1.073, "step": 28905 }, { "epoch": 0.87, "learning_rate": 2.1571986053250698e-07, "loss": 1.0797, "step": 28906 }, { "epoch": 0.87, "learning_rate": 2.1562075150539096e-07, "loss": 0.9639, "step": 28907 }, { "epoch": 0.87, "learning_rate": 2.155216642244648e-07, "loss": 1.0383, "step": 28908 }, { "epoch": 0.87, "learning_rate": 2.154225986906719e-07, "loss": 1.0345, "step": 28909 }, { "epoch": 0.87, "learning_rate": 2.1532355490495565e-07, "loss": 1.0988, "step": 28910 }, { "epoch": 0.87, "learning_rate": 2.1522453286825895e-07, "loss": 1.1346, "step": 28911 }, { "epoch": 0.87, "learning_rate": 2.1512553258152408e-07, "loss": 1.1629, "step": 28912 }, { "epoch": 0.87, "learning_rate": 2.150265540456939e-07, "loss": 1.0927, "step": 28913 }, { "epoch": 0.87, "learning_rate": 2.1492759726171041e-07, "loss": 1.045, "step": 28914 }, { "epoch": 0.87, "learning_rate": 2.1482866223051596e-07, "loss": 1.002, "step": 28915 }, { "epoch": 0.87, "learning_rate": 2.147297489530517e-07, "loss": 1.0363, "step": 28916 }, { "epoch": 0.87, "learning_rate": 2.146308574302597e-07, "loss": 1.0659, "step": 28917 }, { "epoch": 0.87, "learning_rate": 2.1453198766308136e-07, "loss": 1.1268, "step": 28918 }, { "epoch": 0.87, "learning_rate": 2.1443313965245765e-07, "loss": 1.0746, "step": 28919 }, { "epoch": 0.87, "learning_rate": 2.1433431339933002e-07, "loss": 0.9622, "step": 28920 }, { "epoch": 0.87, "learning_rate": 2.1423550890463857e-07, "loss": 1.0661, "step": 28921 }, { "epoch": 0.87, "learning_rate": 2.1413672616932418e-07, "loss": 1.1349, "step": 28922 }, { "epoch": 0.87, "learning_rate": 2.1403796519432723e-07, "loss": 1.2272, "step": 28923 }, { "epoch": 0.87, "learning_rate": 2.1393922598058835e-07, "loss": 1.1762, "step": 28924 }, { "epoch": 0.87, "learning_rate": 2.1384050852904654e-07, "loss": 1.1559, "step": 28925 }, { "epoch": 0.87, "learning_rate": 2.137418128406421e-07, "loss": 1.1998, "step": 28926 }, { "epoch": 0.87, "learning_rate": 2.136431389163146e-07, "loss": 1.0995, "step": 28927 }, { "epoch": 0.87, "learning_rate": 2.1354448675700357e-07, "loss": 1.0968, "step": 28928 }, { "epoch": 0.87, "learning_rate": 2.1344585636364768e-07, "loss": 1.0516, "step": 28929 }, { "epoch": 0.87, "learning_rate": 2.1334724773718562e-07, "loss": 1.0911, "step": 28930 }, { "epoch": 0.87, "learning_rate": 2.1324866087855667e-07, "loss": 1.0668, "step": 28931 }, { "epoch": 0.87, "learning_rate": 2.1315009578869895e-07, "loss": 1.0982, "step": 28932 }, { "epoch": 0.87, "learning_rate": 2.130515524685517e-07, "loss": 1.102, "step": 28933 }, { "epoch": 0.87, "learning_rate": 2.1295303091905139e-07, "loss": 0.9312, "step": 28934 }, { "epoch": 0.87, "learning_rate": 2.1285453114113703e-07, "loss": 1.0615, "step": 28935 }, { "epoch": 0.87, "learning_rate": 2.1275605313574588e-07, "loss": 1.1033, "step": 28936 }, { "epoch": 0.87, "learning_rate": 2.1265759690381554e-07, "loss": 1.127, "step": 28937 }, { "epoch": 0.87, "learning_rate": 2.1255916244628334e-07, "loss": 0.9957, "step": 28938 }, { "epoch": 0.87, "learning_rate": 2.1246074976408627e-07, "loss": 1.1282, "step": 28939 }, { "epoch": 0.87, "learning_rate": 2.123623588581611e-07, "loss": 1.0359, "step": 28940 }, { "epoch": 0.87, "learning_rate": 2.1226398972944483e-07, "loss": 1.1329, "step": 28941 }, { "epoch": 0.87, "learning_rate": 2.1216564237887317e-07, "loss": 1.0503, "step": 28942 }, { "epoch": 0.87, "learning_rate": 2.120673168073828e-07, "loss": 1.1833, "step": 28943 }, { "epoch": 0.87, "learning_rate": 2.1196901301590967e-07, "loss": 1.092, "step": 28944 }, { "epoch": 0.87, "learning_rate": 2.1187073100538968e-07, "loss": 1.0991, "step": 28945 }, { "epoch": 0.87, "learning_rate": 2.117724707767588e-07, "loss": 1.1213, "step": 28946 }, { "epoch": 0.87, "learning_rate": 2.116742323309512e-07, "loss": 0.9972, "step": 28947 }, { "epoch": 0.87, "learning_rate": 2.1157601566890313e-07, "loss": 1.1886, "step": 28948 }, { "epoch": 0.87, "learning_rate": 2.1147782079154884e-07, "loss": 1.1655, "step": 28949 }, { "epoch": 0.87, "learning_rate": 2.1137964769982423e-07, "loss": 1.0785, "step": 28950 }, { "epoch": 0.87, "learning_rate": 2.1128149639466272e-07, "loss": 0.9708, "step": 28951 }, { "epoch": 0.87, "learning_rate": 2.1118336687699914e-07, "loss": 1.057, "step": 28952 }, { "epoch": 0.87, "learning_rate": 2.1108525914776744e-07, "loss": 1.0704, "step": 28953 }, { "epoch": 0.87, "learning_rate": 2.1098717320790217e-07, "loss": 1.1014, "step": 28954 }, { "epoch": 0.87, "learning_rate": 2.108891090583362e-07, "loss": 1.2323, "step": 28955 }, { "epoch": 0.87, "learning_rate": 2.1079106670000322e-07, "loss": 1.1669, "step": 28956 }, { "epoch": 0.87, "learning_rate": 2.106930461338369e-07, "loss": 1.0175, "step": 28957 }, { "epoch": 0.87, "learning_rate": 2.1059504736077042e-07, "loss": 1.0909, "step": 28958 }, { "epoch": 0.87, "learning_rate": 2.1049707038173662e-07, "loss": 1.0565, "step": 28959 }, { "epoch": 0.87, "learning_rate": 2.1039911519766781e-07, "loss": 1.1554, "step": 28960 }, { "epoch": 0.87, "learning_rate": 2.103011818094966e-07, "loss": 1.1474, "step": 28961 }, { "epoch": 0.87, "learning_rate": 2.102032702181553e-07, "loss": 1.0645, "step": 28962 }, { "epoch": 0.87, "learning_rate": 2.1010538042457618e-07, "loss": 1.0691, "step": 28963 }, { "epoch": 0.87, "learning_rate": 2.1000751242969104e-07, "loss": 1.1806, "step": 28964 }, { "epoch": 0.87, "learning_rate": 2.0990966623443186e-07, "loss": 1.158, "step": 28965 }, { "epoch": 0.87, "learning_rate": 2.098118418397291e-07, "loss": 1.0591, "step": 28966 }, { "epoch": 0.87, "learning_rate": 2.0971403924651497e-07, "loss": 1.1184, "step": 28967 }, { "epoch": 0.87, "learning_rate": 2.0961625845571987e-07, "loss": 0.9332, "step": 28968 }, { "epoch": 0.87, "learning_rate": 2.09518499468275e-07, "loss": 1.1124, "step": 28969 }, { "epoch": 0.87, "learning_rate": 2.0942076228511078e-07, "loss": 1.0573, "step": 28970 }, { "epoch": 0.87, "learning_rate": 2.0932304690715776e-07, "loss": 1.1543, "step": 28971 }, { "epoch": 0.87, "learning_rate": 2.0922535333534665e-07, "loss": 1.0274, "step": 28972 }, { "epoch": 0.87, "learning_rate": 2.0912768157060642e-07, "loss": 1.1255, "step": 28973 }, { "epoch": 0.87, "learning_rate": 2.0903003161386743e-07, "loss": 1.1557, "step": 28974 }, { "epoch": 0.87, "learning_rate": 2.0893240346605893e-07, "loss": 1.1949, "step": 28975 }, { "epoch": 0.87, "learning_rate": 2.08834797128111e-07, "loss": 1.079, "step": 28976 }, { "epoch": 0.87, "learning_rate": 2.087372126009521e-07, "loss": 1.1887, "step": 28977 }, { "epoch": 0.87, "learning_rate": 2.0863964988551145e-07, "loss": 1.0743, "step": 28978 }, { "epoch": 0.87, "learning_rate": 2.0854210898271747e-07, "loss": 0.9619, "step": 28979 }, { "epoch": 0.87, "learning_rate": 2.0844458989349975e-07, "loss": 1.2153, "step": 28980 }, { "epoch": 0.87, "learning_rate": 2.0834709261878528e-07, "loss": 0.9564, "step": 28981 }, { "epoch": 0.87, "learning_rate": 2.0824961715950275e-07, "loss": 1.1306, "step": 28982 }, { "epoch": 0.87, "learning_rate": 2.0815216351658036e-07, "loss": 1.032, "step": 28983 }, { "epoch": 0.87, "learning_rate": 2.0805473169094536e-07, "loss": 1.0384, "step": 28984 }, { "epoch": 0.87, "learning_rate": 2.0795732168352596e-07, "loss": 1.0744, "step": 28985 }, { "epoch": 0.87, "learning_rate": 2.0785993349524858e-07, "loss": 1.1265, "step": 28986 }, { "epoch": 0.87, "learning_rate": 2.0776256712704086e-07, "loss": 0.9879, "step": 28987 }, { "epoch": 0.87, "learning_rate": 2.0766522257982924e-07, "loss": 1.0482, "step": 28988 }, { "epoch": 0.87, "learning_rate": 2.0756789985454134e-07, "loss": 1.158, "step": 28989 }, { "epoch": 0.87, "learning_rate": 2.0747059895210227e-07, "loss": 1.1069, "step": 28990 }, { "epoch": 0.87, "learning_rate": 2.07373319873439e-07, "loss": 1.2102, "step": 28991 }, { "epoch": 0.87, "learning_rate": 2.072760626194778e-07, "loss": 1.0715, "step": 28992 }, { "epoch": 0.87, "learning_rate": 2.07178827191144e-07, "loss": 1.0329, "step": 28993 }, { "epoch": 0.87, "learning_rate": 2.0708161358936386e-07, "loss": 1.0553, "step": 28994 }, { "epoch": 0.87, "learning_rate": 2.0698442181506213e-07, "loss": 1.0875, "step": 28995 }, { "epoch": 0.87, "learning_rate": 2.0688725186916446e-07, "loss": 1.0947, "step": 28996 }, { "epoch": 0.87, "learning_rate": 2.0679010375259573e-07, "loss": 0.9984, "step": 28997 }, { "epoch": 0.87, "learning_rate": 2.0669297746628124e-07, "loss": 1.1112, "step": 28998 }, { "epoch": 0.87, "learning_rate": 2.0659587301114475e-07, "loss": 1.2148, "step": 28999 }, { "epoch": 0.87, "learning_rate": 2.0649879038811077e-07, "loss": 1.2285, "step": 29000 }, { "epoch": 0.87, "learning_rate": 2.0640172959810383e-07, "loss": 1.0502, "step": 29001 }, { "epoch": 0.87, "learning_rate": 2.0630469064204823e-07, "loss": 1.1325, "step": 29002 }, { "epoch": 0.87, "learning_rate": 2.0620767352086679e-07, "loss": 1.1202, "step": 29003 }, { "epoch": 0.87, "learning_rate": 2.061106782354838e-07, "loss": 1.126, "step": 29004 }, { "epoch": 0.87, "learning_rate": 2.0601370478682213e-07, "loss": 1.0898, "step": 29005 }, { "epoch": 0.87, "learning_rate": 2.0591675317580577e-07, "loss": 1.0521, "step": 29006 }, { "epoch": 0.87, "learning_rate": 2.058198234033565e-07, "loss": 0.991, "step": 29007 }, { "epoch": 0.87, "learning_rate": 2.057229154703977e-07, "loss": 1.0566, "step": 29008 }, { "epoch": 0.87, "learning_rate": 2.056260293778517e-07, "loss": 1.1497, "step": 29009 }, { "epoch": 0.87, "learning_rate": 2.0552916512664085e-07, "loss": 1.0731, "step": 29010 }, { "epoch": 0.87, "learning_rate": 2.0543232271768798e-07, "loss": 1.1406, "step": 29011 }, { "epoch": 0.87, "learning_rate": 2.053355021519135e-07, "loss": 1.1447, "step": 29012 }, { "epoch": 0.87, "learning_rate": 2.0523870343024028e-07, "loss": 1.1575, "step": 29013 }, { "epoch": 0.87, "learning_rate": 2.0514192655358923e-07, "loss": 1.098, "step": 29014 }, { "epoch": 0.87, "learning_rate": 2.0504517152288213e-07, "loss": 1.1189, "step": 29015 }, { "epoch": 0.87, "learning_rate": 2.0494843833903933e-07, "loss": 1.0839, "step": 29016 }, { "epoch": 0.87, "learning_rate": 2.0485172700298206e-07, "loss": 1.0474, "step": 29017 }, { "epoch": 0.87, "learning_rate": 2.0475503751563097e-07, "loss": 1.0663, "step": 29018 }, { "epoch": 0.87, "learning_rate": 2.0465836987790644e-07, "loss": 1.0383, "step": 29019 }, { "epoch": 0.87, "learning_rate": 2.0456172409072883e-07, "loss": 1.1407, "step": 29020 }, { "epoch": 0.87, "learning_rate": 2.0446510015501824e-07, "loss": 1.1193, "step": 29021 }, { "epoch": 0.87, "learning_rate": 2.0436849807169422e-07, "loss": 1.0176, "step": 29022 }, { "epoch": 0.87, "learning_rate": 2.0427191784167632e-07, "loss": 0.9821, "step": 29023 }, { "epoch": 0.87, "learning_rate": 2.0417535946588463e-07, "loss": 1.1785, "step": 29024 }, { "epoch": 0.87, "learning_rate": 2.0407882294523758e-07, "loss": 1.0119, "step": 29025 }, { "epoch": 0.87, "learning_rate": 2.0398230828065414e-07, "loss": 1.1144, "step": 29026 }, { "epoch": 0.87, "learning_rate": 2.038858154730533e-07, "loss": 1.0552, "step": 29027 }, { "epoch": 0.87, "learning_rate": 2.0378934452335408e-07, "loss": 1.0698, "step": 29028 }, { "epoch": 0.87, "learning_rate": 2.0369289543247407e-07, "loss": 1.1553, "step": 29029 }, { "epoch": 0.87, "learning_rate": 2.0359646820133195e-07, "loss": 1.1574, "step": 29030 }, { "epoch": 0.87, "learning_rate": 2.0350006283084506e-07, "loss": 1.2496, "step": 29031 }, { "epoch": 0.87, "learning_rate": 2.0340367932193238e-07, "loss": 1.1447, "step": 29032 }, { "epoch": 0.87, "learning_rate": 2.0330731767550988e-07, "loss": 0.9952, "step": 29033 }, { "epoch": 0.87, "learning_rate": 2.0321097789249567e-07, "loss": 1.0603, "step": 29034 }, { "epoch": 0.87, "learning_rate": 2.0311465997380682e-07, "loss": 0.9936, "step": 29035 }, { "epoch": 0.87, "learning_rate": 2.0301836392036005e-07, "loss": 1.0611, "step": 29036 }, { "epoch": 0.87, "learning_rate": 2.0292208973307276e-07, "loss": 1.1105, "step": 29037 }, { "epoch": 0.87, "learning_rate": 2.0282583741286028e-07, "loss": 1.0945, "step": 29038 }, { "epoch": 0.87, "learning_rate": 2.0272960696063964e-07, "loss": 1.1693, "step": 29039 }, { "epoch": 0.87, "learning_rate": 2.0263339837732681e-07, "loss": 1.08, "step": 29040 }, { "epoch": 0.87, "learning_rate": 2.0253721166383773e-07, "loss": 1.0428, "step": 29041 }, { "epoch": 0.87, "learning_rate": 2.0244104682108773e-07, "loss": 1.1353, "step": 29042 }, { "epoch": 0.87, "learning_rate": 2.0234490384999224e-07, "loss": 1.1898, "step": 29043 }, { "epoch": 0.87, "learning_rate": 2.0224878275146686e-07, "loss": 1.2576, "step": 29044 }, { "epoch": 0.87, "learning_rate": 2.021526835264262e-07, "loss": 1.1013, "step": 29045 }, { "epoch": 0.88, "learning_rate": 2.020566061757856e-07, "loss": 1.0834, "step": 29046 }, { "epoch": 0.88, "learning_rate": 2.019605507004596e-07, "loss": 1.0977, "step": 29047 }, { "epoch": 0.88, "learning_rate": 2.0186451710136195e-07, "loss": 1.1815, "step": 29048 }, { "epoch": 0.88, "learning_rate": 2.0176850537940746e-07, "loss": 1.1674, "step": 29049 }, { "epoch": 0.88, "learning_rate": 2.0167251553550955e-07, "loss": 1.1168, "step": 29050 }, { "epoch": 0.88, "learning_rate": 2.0157654757058276e-07, "loss": 1.0117, "step": 29051 }, { "epoch": 0.88, "learning_rate": 2.0148060148554e-07, "loss": 1.017, "step": 29052 }, { "epoch": 0.88, "learning_rate": 2.0138467728129524e-07, "loss": 0.9897, "step": 29053 }, { "epoch": 0.88, "learning_rate": 2.0128877495876136e-07, "loss": 1.0224, "step": 29054 }, { "epoch": 0.88, "learning_rate": 2.0119289451885126e-07, "loss": 1.0688, "step": 29055 }, { "epoch": 0.88, "learning_rate": 2.0109703596247725e-07, "loss": 1.0739, "step": 29056 }, { "epoch": 0.88, "learning_rate": 2.0100119929055252e-07, "loss": 1.1413, "step": 29057 }, { "epoch": 0.88, "learning_rate": 2.0090538450398934e-07, "loss": 1.1075, "step": 29058 }, { "epoch": 0.88, "learning_rate": 2.008095916036995e-07, "loss": 1.1136, "step": 29059 }, { "epoch": 0.88, "learning_rate": 2.007138205905948e-07, "loss": 1.131, "step": 29060 }, { "epoch": 0.88, "learning_rate": 2.0061807146558698e-07, "loss": 1.1406, "step": 29061 }, { "epoch": 0.88, "learning_rate": 2.005223442295884e-07, "loss": 1.1707, "step": 29062 }, { "epoch": 0.88, "learning_rate": 2.004266388835091e-07, "loss": 1.0928, "step": 29063 }, { "epoch": 0.88, "learning_rate": 2.003309554282609e-07, "loss": 1.0601, "step": 29064 }, { "epoch": 0.88, "learning_rate": 2.002352938647542e-07, "loss": 1.0234, "step": 29065 }, { "epoch": 0.88, "learning_rate": 2.001396541938999e-07, "loss": 1.0565, "step": 29066 }, { "epoch": 0.88, "learning_rate": 2.0004403641660896e-07, "loss": 1.1624, "step": 29067 }, { "epoch": 0.88, "learning_rate": 1.9994844053379065e-07, "loss": 1.0967, "step": 29068 }, { "epoch": 0.88, "learning_rate": 1.998528665463556e-07, "loss": 1.0643, "step": 29069 }, { "epoch": 0.88, "learning_rate": 1.9975731445521312e-07, "loss": 1.1328, "step": 29070 }, { "epoch": 0.88, "learning_rate": 1.9966178426127387e-07, "loss": 1.0181, "step": 29071 }, { "epoch": 0.88, "learning_rate": 1.9956627596544598e-07, "loss": 1.1075, "step": 29072 }, { "epoch": 0.88, "learning_rate": 1.994707895686393e-07, "loss": 1.0984, "step": 29073 }, { "epoch": 0.88, "learning_rate": 1.9937532507176284e-07, "loss": 1.0526, "step": 29074 }, { "epoch": 0.88, "learning_rate": 1.9927988247572527e-07, "loss": 1.0231, "step": 29075 }, { "epoch": 0.88, "learning_rate": 1.991844617814348e-07, "loss": 1.1463, "step": 29076 }, { "epoch": 0.88, "learning_rate": 1.990890629898004e-07, "loss": 1.0002, "step": 29077 }, { "epoch": 0.88, "learning_rate": 1.9899368610172997e-07, "loss": 1.1053, "step": 29078 }, { "epoch": 0.88, "learning_rate": 1.988983311181314e-07, "loss": 1.0403, "step": 29079 }, { "epoch": 0.88, "learning_rate": 1.9880299803991283e-07, "loss": 0.9825, "step": 29080 }, { "epoch": 0.88, "learning_rate": 1.987076868679813e-07, "loss": 1.131, "step": 29081 }, { "epoch": 0.88, "learning_rate": 1.986123976032439e-07, "loss": 1.0668, "step": 29082 }, { "epoch": 0.88, "learning_rate": 1.9851713024660824e-07, "loss": 1.0779, "step": 29083 }, { "epoch": 0.88, "learning_rate": 1.9842188479898133e-07, "loss": 1.0292, "step": 29084 }, { "epoch": 0.88, "learning_rate": 1.9832666126126942e-07, "loss": 1.1362, "step": 29085 }, { "epoch": 0.88, "learning_rate": 1.9823145963437902e-07, "loss": 1.0747, "step": 29086 }, { "epoch": 0.88, "learning_rate": 1.9813627991921657e-07, "loss": 1.2219, "step": 29087 }, { "epoch": 0.88, "learning_rate": 1.9804112211668862e-07, "loss": 1.1804, "step": 29088 }, { "epoch": 0.88, "learning_rate": 1.979459862277e-07, "loss": 1.049, "step": 29089 }, { "epoch": 0.88, "learning_rate": 1.9785087225315692e-07, "loss": 1.0916, "step": 29090 }, { "epoch": 0.88, "learning_rate": 1.9775578019396502e-07, "loss": 1.1604, "step": 29091 }, { "epoch": 0.88, "learning_rate": 1.9766071005102888e-07, "loss": 1.1594, "step": 29092 }, { "epoch": 0.88, "learning_rate": 1.9756566182525472e-07, "loss": 1.1371, "step": 29093 }, { "epoch": 0.88, "learning_rate": 1.9747063551754598e-07, "loss": 1.1083, "step": 29094 }, { "epoch": 0.88, "learning_rate": 1.9737563112880776e-07, "loss": 1.0894, "step": 29095 }, { "epoch": 0.88, "learning_rate": 1.9728064865994462e-07, "loss": 1.0251, "step": 29096 }, { "epoch": 0.88, "learning_rate": 1.971856881118611e-07, "loss": 1.0536, "step": 29097 }, { "epoch": 0.88, "learning_rate": 1.970907494854604e-07, "loss": 1.1782, "step": 29098 }, { "epoch": 0.88, "learning_rate": 1.9699583278164653e-07, "loss": 1.1797, "step": 29099 }, { "epoch": 0.88, "learning_rate": 1.9690093800132342e-07, "loss": 1.0185, "step": 29100 }, { "epoch": 0.88, "learning_rate": 1.9680606514539375e-07, "loss": 1.0153, "step": 29101 }, { "epoch": 0.88, "learning_rate": 1.9671121421476147e-07, "loss": 1.095, "step": 29102 }, { "epoch": 0.88, "learning_rate": 1.9661638521032893e-07, "loss": 1.0565, "step": 29103 }, { "epoch": 0.88, "learning_rate": 1.9652157813299904e-07, "loss": 1.1879, "step": 29104 }, { "epoch": 0.88, "learning_rate": 1.964267929836744e-07, "loss": 1.139, "step": 29105 }, { "epoch": 0.88, "learning_rate": 1.9633202976325788e-07, "loss": 1.176, "step": 29106 }, { "epoch": 0.88, "learning_rate": 1.9623728847265018e-07, "loss": 1.0336, "step": 29107 }, { "epoch": 0.88, "learning_rate": 1.9614256911275415e-07, "loss": 1.1318, "step": 29108 }, { "epoch": 0.88, "learning_rate": 1.960478716844713e-07, "loss": 1.1471, "step": 29109 }, { "epoch": 0.88, "learning_rate": 1.9595319618870346e-07, "loss": 1.0749, "step": 29110 }, { "epoch": 0.88, "learning_rate": 1.9585854262635097e-07, "loss": 1.1522, "step": 29111 }, { "epoch": 0.88, "learning_rate": 1.957639109983156e-07, "loss": 1.1675, "step": 29112 }, { "epoch": 0.88, "learning_rate": 1.9566930130549806e-07, "loss": 1.0564, "step": 29113 }, { "epoch": 0.88, "learning_rate": 1.9557471354879926e-07, "loss": 1.1356, "step": 29114 }, { "epoch": 0.88, "learning_rate": 1.9548014772911906e-07, "loss": 1.0861, "step": 29115 }, { "epoch": 0.88, "learning_rate": 1.9538560384735783e-07, "loss": 1.0932, "step": 29116 }, { "epoch": 0.88, "learning_rate": 1.952910819044157e-07, "loss": 1.2293, "step": 29117 }, { "epoch": 0.88, "learning_rate": 1.951965819011925e-07, "loss": 1.256, "step": 29118 }, { "epoch": 0.88, "learning_rate": 1.9510210383858835e-07, "loss": 1.09, "step": 29119 }, { "epoch": 0.88, "learning_rate": 1.950076477175017e-07, "loss": 1.1137, "step": 29120 }, { "epoch": 0.88, "learning_rate": 1.949132135388321e-07, "loss": 1.1296, "step": 29121 }, { "epoch": 0.88, "learning_rate": 1.9481880130347852e-07, "loss": 1.1415, "step": 29122 }, { "epoch": 0.88, "learning_rate": 1.9472441101234003e-07, "loss": 1.0472, "step": 29123 }, { "epoch": 0.88, "learning_rate": 1.9463004266631445e-07, "loss": 1.0999, "step": 29124 }, { "epoch": 0.88, "learning_rate": 1.945356962663006e-07, "loss": 1.0709, "step": 29125 }, { "epoch": 0.88, "learning_rate": 1.9444137181319682e-07, "loss": 1.0965, "step": 29126 }, { "epoch": 0.88, "learning_rate": 1.9434706930790052e-07, "loss": 1.1008, "step": 29127 }, { "epoch": 0.88, "learning_rate": 1.9425278875130987e-07, "loss": 1.1121, "step": 29128 }, { "epoch": 0.88, "learning_rate": 1.9415853014432245e-07, "loss": 1.1552, "step": 29129 }, { "epoch": 0.88, "learning_rate": 1.940642934878348e-07, "loss": 1.0883, "step": 29130 }, { "epoch": 0.88, "learning_rate": 1.9397007878274476e-07, "loss": 1.2009, "step": 29131 }, { "epoch": 0.88, "learning_rate": 1.9387588602994862e-07, "loss": 1.0556, "step": 29132 }, { "epoch": 0.88, "learning_rate": 1.9378171523034368e-07, "loss": 1.082, "step": 29133 }, { "epoch": 0.88, "learning_rate": 1.9368756638482588e-07, "loss": 1.0521, "step": 29134 }, { "epoch": 0.88, "learning_rate": 1.9359343949429178e-07, "loss": 1.1338, "step": 29135 }, { "epoch": 0.88, "learning_rate": 1.9349933455963782e-07, "loss": 1.0759, "step": 29136 }, { "epoch": 0.88, "learning_rate": 1.934052515817589e-07, "loss": 1.1196, "step": 29137 }, { "epoch": 0.88, "learning_rate": 1.933111905615509e-07, "loss": 1.0683, "step": 29138 }, { "epoch": 0.88, "learning_rate": 1.9321715149990955e-07, "loss": 1.0902, "step": 29139 }, { "epoch": 0.88, "learning_rate": 1.931231343977305e-07, "loss": 1.0757, "step": 29140 }, { "epoch": 0.88, "learning_rate": 1.930291392559075e-07, "loss": 1.1026, "step": 29141 }, { "epoch": 0.88, "learning_rate": 1.929351660753362e-07, "loss": 1.1631, "step": 29142 }, { "epoch": 0.88, "learning_rate": 1.9284121485691116e-07, "loss": 0.9124, "step": 29143 }, { "epoch": 0.88, "learning_rate": 1.927472856015264e-07, "loss": 1.0937, "step": 29144 }, { "epoch": 0.88, "learning_rate": 1.9265337831007647e-07, "loss": 1.0977, "step": 29145 }, { "epoch": 0.88, "learning_rate": 1.925594929834551e-07, "loss": 1.1079, "step": 29146 }, { "epoch": 0.88, "learning_rate": 1.9246562962255577e-07, "loss": 1.1129, "step": 29147 }, { "epoch": 0.88, "learning_rate": 1.9237178822827246e-07, "loss": 1.0672, "step": 29148 }, { "epoch": 0.88, "learning_rate": 1.9227796880149864e-07, "loss": 1.1874, "step": 29149 }, { "epoch": 0.88, "learning_rate": 1.9218417134312662e-07, "loss": 1.0886, "step": 29150 }, { "epoch": 0.88, "learning_rate": 1.9209039585405014e-07, "loss": 1.125, "step": 29151 }, { "epoch": 0.88, "learning_rate": 1.919966423351613e-07, "loss": 1.2153, "step": 29152 }, { "epoch": 0.88, "learning_rate": 1.9190291078735324e-07, "loss": 1.0264, "step": 29153 }, { "epoch": 0.88, "learning_rate": 1.9180920121151748e-07, "loss": 1.0644, "step": 29154 }, { "epoch": 0.88, "learning_rate": 1.9171551360854661e-07, "loss": 1.0435, "step": 29155 }, { "epoch": 0.88, "learning_rate": 1.916218479793322e-07, "loss": 1.2036, "step": 29156 }, { "epoch": 0.88, "learning_rate": 1.9152820432476598e-07, "loss": 1.0956, "step": 29157 }, { "epoch": 0.88, "learning_rate": 1.9143458264573976e-07, "loss": 0.9852, "step": 29158 }, { "epoch": 0.88, "learning_rate": 1.9134098294314425e-07, "loss": 1.1033, "step": 29159 }, { "epoch": 0.88, "learning_rate": 1.9124740521787062e-07, "loss": 1.1104, "step": 29160 }, { "epoch": 0.88, "learning_rate": 1.9115384947080984e-07, "loss": 1.0808, "step": 29161 }, { "epoch": 0.88, "learning_rate": 1.9106031570285287e-07, "loss": 1.1428, "step": 29162 }, { "epoch": 0.88, "learning_rate": 1.909668039148893e-07, "loss": 1.0554, "step": 29163 }, { "epoch": 0.88, "learning_rate": 1.9087331410780953e-07, "loss": 1.19, "step": 29164 }, { "epoch": 0.88, "learning_rate": 1.907798462825039e-07, "loss": 1.1964, "step": 29165 }, { "epoch": 0.88, "learning_rate": 1.9068640043986232e-07, "loss": 1.0338, "step": 29166 }, { "epoch": 0.88, "learning_rate": 1.9059297658077347e-07, "loss": 1.1602, "step": 29167 }, { "epoch": 0.88, "learning_rate": 1.9049957470612752e-07, "loss": 1.0253, "step": 29168 }, { "epoch": 0.88, "learning_rate": 1.9040619481681317e-07, "loss": 1.1232, "step": 29169 }, { "epoch": 0.88, "learning_rate": 1.9031283691371943e-07, "loss": 1.1541, "step": 29170 }, { "epoch": 0.88, "learning_rate": 1.9021950099773533e-07, "loss": 1.162, "step": 29171 }, { "epoch": 0.88, "learning_rate": 1.9012618706974907e-07, "loss": 1.1005, "step": 29172 }, { "epoch": 0.88, "learning_rate": 1.9003289513064904e-07, "loss": 1.1362, "step": 29173 }, { "epoch": 0.88, "learning_rate": 1.8993962518132319e-07, "loss": 1.1749, "step": 29174 }, { "epoch": 0.88, "learning_rate": 1.8984637722265998e-07, "loss": 0.9532, "step": 29175 }, { "epoch": 0.88, "learning_rate": 1.8975315125554617e-07, "loss": 1.0528, "step": 29176 }, { "epoch": 0.88, "learning_rate": 1.8965994728086968e-07, "loss": 0.9964, "step": 29177 }, { "epoch": 0.88, "learning_rate": 1.8956676529951812e-07, "loss": 1.1213, "step": 29178 }, { "epoch": 0.88, "learning_rate": 1.894736053123783e-07, "loss": 1.1371, "step": 29179 }, { "epoch": 0.88, "learning_rate": 1.893804673203367e-07, "loss": 1.0213, "step": 29180 }, { "epoch": 0.88, "learning_rate": 1.8928735132428015e-07, "loss": 1.1072, "step": 29181 }, { "epoch": 0.88, "learning_rate": 1.8919425732509516e-07, "loss": 1.0136, "step": 29182 }, { "epoch": 0.88, "learning_rate": 1.8910118532366794e-07, "loss": 1.1141, "step": 29183 }, { "epoch": 0.88, "learning_rate": 1.8900813532088446e-07, "loss": 1.0628, "step": 29184 }, { "epoch": 0.88, "learning_rate": 1.889151073176304e-07, "loss": 0.9647, "step": 29185 }, { "epoch": 0.88, "learning_rate": 1.8882210131479145e-07, "loss": 1.1086, "step": 29186 }, { "epoch": 0.88, "learning_rate": 1.8872911731325327e-07, "loss": 1.0758, "step": 29187 }, { "epoch": 0.88, "learning_rate": 1.8863615531390102e-07, "loss": 1.0628, "step": 29188 }, { "epoch": 0.88, "learning_rate": 1.8854321531761894e-07, "loss": 1.118, "step": 29189 }, { "epoch": 0.88, "learning_rate": 1.884502973252922e-07, "loss": 1.0187, "step": 29190 }, { "epoch": 0.88, "learning_rate": 1.8835740133780534e-07, "loss": 1.156, "step": 29191 }, { "epoch": 0.88, "learning_rate": 1.8826452735604324e-07, "loss": 1.1104, "step": 29192 }, { "epoch": 0.88, "learning_rate": 1.8817167538088876e-07, "loss": 0.9783, "step": 29193 }, { "epoch": 0.88, "learning_rate": 1.880788454132268e-07, "loss": 1.0912, "step": 29194 }, { "epoch": 0.88, "learning_rate": 1.879860374539408e-07, "loss": 1.1125, "step": 29195 }, { "epoch": 0.88, "learning_rate": 1.8789325150391391e-07, "loss": 1.0596, "step": 29196 }, { "epoch": 0.88, "learning_rate": 1.8780048756403047e-07, "loss": 1.061, "step": 29197 }, { "epoch": 0.88, "learning_rate": 1.8770774563517225e-07, "loss": 1.0573, "step": 29198 }, { "epoch": 0.88, "learning_rate": 1.876150257182227e-07, "loss": 1.2014, "step": 29199 }, { "epoch": 0.88, "learning_rate": 1.875223278140642e-07, "loss": 1.1463, "step": 29200 }, { "epoch": 0.88, "learning_rate": 1.8742965192357993e-07, "loss": 1.0386, "step": 29201 }, { "epoch": 0.88, "learning_rate": 1.8733699804765137e-07, "loss": 1.1378, "step": 29202 }, { "epoch": 0.88, "learning_rate": 1.8724436618716062e-07, "loss": 1.1501, "step": 29203 }, { "epoch": 0.88, "learning_rate": 1.8715175634298976e-07, "loss": 1.0965, "step": 29204 }, { "epoch": 0.88, "learning_rate": 1.8705916851602058e-07, "loss": 1.0984, "step": 29205 }, { "epoch": 0.88, "learning_rate": 1.8696660270713372e-07, "loss": 1.147, "step": 29206 }, { "epoch": 0.88, "learning_rate": 1.8687405891721077e-07, "loss": 0.9958, "step": 29207 }, { "epoch": 0.88, "learning_rate": 1.8678153714713293e-07, "loss": 1.0501, "step": 29208 }, { "epoch": 0.88, "learning_rate": 1.866890373977806e-07, "loss": 1.1827, "step": 29209 }, { "epoch": 0.88, "learning_rate": 1.8659655967003448e-07, "loss": 1.0882, "step": 29210 }, { "epoch": 0.88, "learning_rate": 1.8650410396477526e-07, "loss": 1.0388, "step": 29211 }, { "epoch": 0.88, "learning_rate": 1.8641167028288276e-07, "loss": 1.1749, "step": 29212 }, { "epoch": 0.88, "learning_rate": 1.8631925862523687e-07, "loss": 1.1309, "step": 29213 }, { "epoch": 0.88, "learning_rate": 1.8622686899271686e-07, "loss": 1.0055, "step": 29214 }, { "epoch": 0.88, "learning_rate": 1.8613450138620315e-07, "loss": 1.0369, "step": 29215 }, { "epoch": 0.88, "learning_rate": 1.8604215580657447e-07, "loss": 1.078, "step": 29216 }, { "epoch": 0.88, "learning_rate": 1.8594983225470987e-07, "loss": 1.2625, "step": 29217 }, { "epoch": 0.88, "learning_rate": 1.8585753073148888e-07, "loss": 1.1276, "step": 29218 }, { "epoch": 0.88, "learning_rate": 1.8576525123778915e-07, "loss": 1.2079, "step": 29219 }, { "epoch": 0.88, "learning_rate": 1.8567299377449e-07, "loss": 1.1222, "step": 29220 }, { "epoch": 0.88, "learning_rate": 1.8558075834246902e-07, "loss": 0.9719, "step": 29221 }, { "epoch": 0.88, "learning_rate": 1.8548854494260472e-07, "loss": 1.0911, "step": 29222 }, { "epoch": 0.88, "learning_rate": 1.8539635357577495e-07, "loss": 1.0283, "step": 29223 }, { "epoch": 0.88, "learning_rate": 1.8530418424285685e-07, "loss": 1.1476, "step": 29224 }, { "epoch": 0.88, "learning_rate": 1.8521203694472827e-07, "loss": 1.0145, "step": 29225 }, { "epoch": 0.88, "learning_rate": 1.8511991168226606e-07, "loss": 1.0034, "step": 29226 }, { "epoch": 0.88, "learning_rate": 1.8502780845634781e-07, "loss": 1.0499, "step": 29227 }, { "epoch": 0.88, "learning_rate": 1.8493572726784952e-07, "loss": 0.9625, "step": 29228 }, { "epoch": 0.88, "learning_rate": 1.8484366811764827e-07, "loss": 1.1083, "step": 29229 }, { "epoch": 0.88, "learning_rate": 1.8475163100662025e-07, "loss": 1.1714, "step": 29230 }, { "epoch": 0.88, "learning_rate": 1.84659615935642e-07, "loss": 0.9875, "step": 29231 }, { "epoch": 0.88, "learning_rate": 1.8456762290558873e-07, "loss": 1.1499, "step": 29232 }, { "epoch": 0.88, "learning_rate": 1.844756519173363e-07, "loss": 1.1419, "step": 29233 }, { "epoch": 0.88, "learning_rate": 1.8438370297176072e-07, "loss": 1.1286, "step": 29234 }, { "epoch": 0.88, "learning_rate": 1.8429177606973715e-07, "loss": 1.0507, "step": 29235 }, { "epoch": 0.88, "learning_rate": 1.8419987121214068e-07, "loss": 1.0901, "step": 29236 }, { "epoch": 0.88, "learning_rate": 1.841079883998459e-07, "loss": 1.1788, "step": 29237 }, { "epoch": 0.88, "learning_rate": 1.8401612763372767e-07, "loss": 1.04, "step": 29238 }, { "epoch": 0.88, "learning_rate": 1.8392428891466057e-07, "loss": 1.0823, "step": 29239 }, { "epoch": 0.88, "learning_rate": 1.8383247224351863e-07, "loss": 1.0862, "step": 29240 }, { "epoch": 0.88, "learning_rate": 1.8374067762117614e-07, "loss": 1.0628, "step": 29241 }, { "epoch": 0.88, "learning_rate": 1.8364890504850656e-07, "loss": 1.1187, "step": 29242 }, { "epoch": 0.88, "learning_rate": 1.8355715452638424e-07, "loss": 1.1816, "step": 29243 }, { "epoch": 0.88, "learning_rate": 1.834654260556823e-07, "loss": 1.1747, "step": 29244 }, { "epoch": 0.88, "learning_rate": 1.8337371963727368e-07, "loss": 1.1582, "step": 29245 }, { "epoch": 0.88, "learning_rate": 1.832820352720313e-07, "loss": 0.9574, "step": 29246 }, { "epoch": 0.88, "learning_rate": 1.8319037296082808e-07, "loss": 1.0654, "step": 29247 }, { "epoch": 0.88, "learning_rate": 1.830987327045375e-07, "loss": 1.0712, "step": 29248 }, { "epoch": 0.88, "learning_rate": 1.8300711450403046e-07, "loss": 1.1929, "step": 29249 }, { "epoch": 0.88, "learning_rate": 1.8291551836017968e-07, "loss": 1.0391, "step": 29250 }, { "epoch": 0.88, "learning_rate": 1.8282394427385746e-07, "loss": 1.1157, "step": 29251 }, { "epoch": 0.88, "learning_rate": 1.8273239224593508e-07, "loss": 1.0821, "step": 29252 }, { "epoch": 0.88, "learning_rate": 1.826408622772849e-07, "loss": 1.0641, "step": 29253 }, { "epoch": 0.88, "learning_rate": 1.82549354368777e-07, "loss": 1.1335, "step": 29254 }, { "epoch": 0.88, "learning_rate": 1.8245786852128327e-07, "loss": 1.0739, "step": 29255 }, { "epoch": 0.88, "learning_rate": 1.8236640473567463e-07, "loss": 1.0225, "step": 29256 }, { "epoch": 0.88, "learning_rate": 1.8227496301282178e-07, "loss": 1.0552, "step": 29257 }, { "epoch": 0.88, "learning_rate": 1.8218354335359456e-07, "loss": 1.1395, "step": 29258 }, { "epoch": 0.88, "learning_rate": 1.8209214575886397e-07, "loss": 1.1479, "step": 29259 }, { "epoch": 0.88, "learning_rate": 1.8200077022949958e-07, "loss": 1.0536, "step": 29260 }, { "epoch": 0.88, "learning_rate": 1.8190941676637182e-07, "loss": 1.298, "step": 29261 }, { "epoch": 0.88, "learning_rate": 1.8181808537034995e-07, "loss": 1.1059, "step": 29262 }, { "epoch": 0.88, "learning_rate": 1.8172677604230305e-07, "loss": 1.0507, "step": 29263 }, { "epoch": 0.88, "learning_rate": 1.8163548878310093e-07, "loss": 1.094, "step": 29264 }, { "epoch": 0.88, "learning_rate": 1.815442235936124e-07, "loss": 1.0233, "step": 29265 }, { "epoch": 0.88, "learning_rate": 1.8145298047470615e-07, "loss": 1.032, "step": 29266 }, { "epoch": 0.88, "learning_rate": 1.813617594272507e-07, "loss": 1.0819, "step": 29267 }, { "epoch": 0.88, "learning_rate": 1.8127056045211506e-07, "loss": 1.2079, "step": 29268 }, { "epoch": 0.88, "learning_rate": 1.8117938355016656e-07, "loss": 1.0334, "step": 29269 }, { "epoch": 0.88, "learning_rate": 1.8108822872227428e-07, "loss": 1.1647, "step": 29270 }, { "epoch": 0.88, "learning_rate": 1.8099709596930442e-07, "loss": 0.9678, "step": 29271 }, { "epoch": 0.88, "learning_rate": 1.8090598529212577e-07, "loss": 1.1083, "step": 29272 }, { "epoch": 0.88, "learning_rate": 1.8081489669160485e-07, "loss": 1.0311, "step": 29273 }, { "epoch": 0.88, "learning_rate": 1.8072383016860984e-07, "loss": 1.2333, "step": 29274 }, { "epoch": 0.88, "learning_rate": 1.8063278572400646e-07, "loss": 1.0007, "step": 29275 }, { "epoch": 0.88, "learning_rate": 1.8054176335866175e-07, "loss": 1.088, "step": 29276 }, { "epoch": 0.88, "learning_rate": 1.8045076307344257e-07, "loss": 1.1121, "step": 29277 }, { "epoch": 0.88, "learning_rate": 1.8035978486921485e-07, "loss": 1.0555, "step": 29278 }, { "epoch": 0.88, "learning_rate": 1.8026882874684544e-07, "loss": 1.1825, "step": 29279 }, { "epoch": 0.88, "learning_rate": 1.8017789470719887e-07, "loss": 1.0516, "step": 29280 }, { "epoch": 0.88, "learning_rate": 1.8008698275114173e-07, "loss": 1.0597, "step": 29281 }, { "epoch": 0.88, "learning_rate": 1.7999609287953912e-07, "loss": 1.0912, "step": 29282 }, { "epoch": 0.88, "learning_rate": 1.7990522509325676e-07, "loss": 1.2317, "step": 29283 }, { "epoch": 0.88, "learning_rate": 1.7981437939315894e-07, "loss": 1.1459, "step": 29284 }, { "epoch": 0.88, "learning_rate": 1.7972355578011052e-07, "loss": 1.1889, "step": 29285 }, { "epoch": 0.88, "learning_rate": 1.7963275425497668e-07, "loss": 1.1969, "step": 29286 }, { "epoch": 0.88, "learning_rate": 1.7954197481862168e-07, "loss": 1.1968, "step": 29287 }, { "epoch": 0.88, "learning_rate": 1.7945121747190903e-07, "loss": 1.0251, "step": 29288 }, { "epoch": 0.88, "learning_rate": 1.7936048221570328e-07, "loss": 1.0608, "step": 29289 }, { "epoch": 0.88, "learning_rate": 1.7926976905086825e-07, "loss": 1.0339, "step": 29290 }, { "epoch": 0.88, "learning_rate": 1.7917907797826705e-07, "loss": 1.1509, "step": 29291 }, { "epoch": 0.88, "learning_rate": 1.7908840899876351e-07, "loss": 1.1956, "step": 29292 }, { "epoch": 0.88, "learning_rate": 1.7899776211322052e-07, "loss": 1.1492, "step": 29293 }, { "epoch": 0.88, "learning_rate": 1.7890713732250125e-07, "loss": 1.0493, "step": 29294 }, { "epoch": 0.88, "learning_rate": 1.7881653462746783e-07, "loss": 1.1013, "step": 29295 }, { "epoch": 0.88, "learning_rate": 1.787259540289829e-07, "loss": 1.1068, "step": 29296 }, { "epoch": 0.88, "learning_rate": 1.786353955279091e-07, "loss": 1.0013, "step": 29297 }, { "epoch": 0.88, "learning_rate": 1.785448591251085e-07, "loss": 1.1129, "step": 29298 }, { "epoch": 0.88, "learning_rate": 1.7845434482144265e-07, "loss": 1.1611, "step": 29299 }, { "epoch": 0.88, "learning_rate": 1.7836385261777362e-07, "loss": 1.1481, "step": 29300 }, { "epoch": 0.88, "learning_rate": 1.7827338251496213e-07, "loss": 1.0812, "step": 29301 }, { "epoch": 0.88, "learning_rate": 1.7818293451386998e-07, "loss": 1.1683, "step": 29302 }, { "epoch": 0.88, "learning_rate": 1.7809250861535815e-07, "loss": 1.0707, "step": 29303 }, { "epoch": 0.88, "learning_rate": 1.7800210482028734e-07, "loss": 1.0757, "step": 29304 }, { "epoch": 0.88, "learning_rate": 1.7791172312951855e-07, "loss": 1.2014, "step": 29305 }, { "epoch": 0.88, "learning_rate": 1.7782136354391134e-07, "loss": 1.2924, "step": 29306 }, { "epoch": 0.88, "learning_rate": 1.7773102606432642e-07, "loss": 1.084, "step": 29307 }, { "epoch": 0.88, "learning_rate": 1.7764071069162363e-07, "loss": 1.1146, "step": 29308 }, { "epoch": 0.88, "learning_rate": 1.7755041742666318e-07, "loss": 1.0751, "step": 29309 }, { "epoch": 0.88, "learning_rate": 1.7746014627030378e-07, "loss": 1.1619, "step": 29310 }, { "epoch": 0.88, "learning_rate": 1.7736989722340531e-07, "loss": 1.1334, "step": 29311 }, { "epoch": 0.88, "learning_rate": 1.772796702868268e-07, "loss": 1.1354, "step": 29312 }, { "epoch": 0.88, "learning_rate": 1.7718946546142756e-07, "loss": 1.1253, "step": 29313 }, { "epoch": 0.88, "learning_rate": 1.7709928274806555e-07, "loss": 1.0071, "step": 29314 }, { "epoch": 0.88, "learning_rate": 1.7700912214759947e-07, "loss": 1.0167, "step": 29315 }, { "epoch": 0.88, "learning_rate": 1.7691898366088784e-07, "loss": 1.1245, "step": 29316 }, { "epoch": 0.88, "learning_rate": 1.7682886728878884e-07, "loss": 1.1047, "step": 29317 }, { "epoch": 0.88, "learning_rate": 1.7673877303216015e-07, "loss": 1.1254, "step": 29318 }, { "epoch": 0.88, "learning_rate": 1.7664870089185937e-07, "loss": 1.0918, "step": 29319 }, { "epoch": 0.88, "learning_rate": 1.765586508687439e-07, "loss": 1.0416, "step": 29320 }, { "epoch": 0.88, "learning_rate": 1.7646862296367084e-07, "loss": 1.02, "step": 29321 }, { "epoch": 0.88, "learning_rate": 1.7637861717749783e-07, "loss": 1.1056, "step": 29322 }, { "epoch": 0.88, "learning_rate": 1.7628863351108112e-07, "loss": 1.051, "step": 29323 }, { "epoch": 0.88, "learning_rate": 1.7619867196527724e-07, "loss": 1.0588, "step": 29324 }, { "epoch": 0.88, "learning_rate": 1.7610873254094302e-07, "loss": 1.1569, "step": 29325 }, { "epoch": 0.88, "learning_rate": 1.76018815238935e-07, "loss": 1.0734, "step": 29326 }, { "epoch": 0.88, "learning_rate": 1.7592892006010804e-07, "loss": 1.0038, "step": 29327 }, { "epoch": 0.88, "learning_rate": 1.758390470053184e-07, "loss": 1.1293, "step": 29328 }, { "epoch": 0.88, "learning_rate": 1.757491960754218e-07, "loss": 1.1376, "step": 29329 }, { "epoch": 0.88, "learning_rate": 1.7565936727127337e-07, "loss": 1.1168, "step": 29330 }, { "epoch": 0.88, "learning_rate": 1.7556956059372882e-07, "loss": 1.1893, "step": 29331 }, { "epoch": 0.88, "learning_rate": 1.754797760436419e-07, "loss": 1.1606, "step": 29332 }, { "epoch": 0.88, "learning_rate": 1.7539001362186835e-07, "loss": 1.0546, "step": 29333 }, { "epoch": 0.88, "learning_rate": 1.7530027332926193e-07, "loss": 0.9855, "step": 29334 }, { "epoch": 0.88, "learning_rate": 1.75210555166678e-07, "loss": 1.0961, "step": 29335 }, { "epoch": 0.88, "learning_rate": 1.751208591349693e-07, "loss": 1.075, "step": 29336 }, { "epoch": 0.88, "learning_rate": 1.7503118523499064e-07, "loss": 1.2757, "step": 29337 }, { "epoch": 0.88, "learning_rate": 1.7494153346759496e-07, "loss": 1.1427, "step": 29338 }, { "epoch": 0.88, "learning_rate": 1.7485190383363686e-07, "loss": 1.0558, "step": 29339 }, { "epoch": 0.88, "learning_rate": 1.7476229633396818e-07, "loss": 0.97, "step": 29340 }, { "epoch": 0.88, "learning_rate": 1.7467271096944265e-07, "loss": 1.0613, "step": 29341 }, { "epoch": 0.88, "learning_rate": 1.7458314774091295e-07, "loss": 1.0638, "step": 29342 }, { "epoch": 0.88, "learning_rate": 1.744936066492317e-07, "loss": 1.2128, "step": 29343 }, { "epoch": 0.88, "learning_rate": 1.7440408769525185e-07, "loss": 1.1262, "step": 29344 }, { "epoch": 0.88, "learning_rate": 1.7431459087982438e-07, "loss": 1.092, "step": 29345 }, { "epoch": 0.88, "learning_rate": 1.7422511620380223e-07, "loss": 1.11, "step": 29346 }, { "epoch": 0.88, "learning_rate": 1.7413566366803663e-07, "loss": 1.0403, "step": 29347 }, { "epoch": 0.88, "learning_rate": 1.7404623327337943e-07, "loss": 1.1043, "step": 29348 }, { "epoch": 0.88, "learning_rate": 1.739568250206816e-07, "loss": 1.2338, "step": 29349 }, { "epoch": 0.88, "learning_rate": 1.73867438910795e-07, "loss": 1.1278, "step": 29350 }, { "epoch": 0.88, "learning_rate": 1.7377807494456973e-07, "loss": 1.0435, "step": 29351 }, { "epoch": 0.88, "learning_rate": 1.7368873312285734e-07, "loss": 1.1542, "step": 29352 }, { "epoch": 0.88, "learning_rate": 1.7359941344650744e-07, "loss": 1.0013, "step": 29353 }, { "epoch": 0.88, "learning_rate": 1.7351011591637074e-07, "loss": 1.188, "step": 29354 }, { "epoch": 0.88, "learning_rate": 1.734208405332971e-07, "loss": 1.1456, "step": 29355 }, { "epoch": 0.88, "learning_rate": 1.7333158729813672e-07, "loss": 1.216, "step": 29356 }, { "epoch": 0.88, "learning_rate": 1.732423562117394e-07, "loss": 1.0961, "step": 29357 }, { "epoch": 0.88, "learning_rate": 1.7315314727495398e-07, "loss": 1.0477, "step": 29358 }, { "epoch": 0.88, "learning_rate": 1.7306396048862973e-07, "loss": 0.9603, "step": 29359 }, { "epoch": 0.88, "learning_rate": 1.7297479585361598e-07, "loss": 0.9695, "step": 29360 }, { "epoch": 0.88, "learning_rate": 1.728856533707618e-07, "loss": 1.0233, "step": 29361 }, { "epoch": 0.88, "learning_rate": 1.727965330409151e-07, "loss": 1.1018, "step": 29362 }, { "epoch": 0.88, "learning_rate": 1.7270743486492437e-07, "loss": 1.1287, "step": 29363 }, { "epoch": 0.88, "learning_rate": 1.7261835884363838e-07, "loss": 0.9783, "step": 29364 }, { "epoch": 0.88, "learning_rate": 1.7252930497790477e-07, "loss": 1.0324, "step": 29365 }, { "epoch": 0.88, "learning_rate": 1.7244027326857095e-07, "loss": 1.0949, "step": 29366 }, { "epoch": 0.88, "learning_rate": 1.723512637164848e-07, "loss": 1.0818, "step": 29367 }, { "epoch": 0.88, "learning_rate": 1.7226227632249348e-07, "loss": 1.1337, "step": 29368 }, { "epoch": 0.88, "learning_rate": 1.7217331108744435e-07, "loss": 1.0654, "step": 29369 }, { "epoch": 0.88, "learning_rate": 1.7208436801218447e-07, "loss": 1.0483, "step": 29370 }, { "epoch": 0.88, "learning_rate": 1.7199544709755988e-07, "loss": 0.9969, "step": 29371 }, { "epoch": 0.88, "learning_rate": 1.719065483444174e-07, "loss": 1.0715, "step": 29372 }, { "epoch": 0.88, "learning_rate": 1.7181767175360326e-07, "loss": 1.0634, "step": 29373 }, { "epoch": 0.88, "learning_rate": 1.7172881732596376e-07, "loss": 1.1489, "step": 29374 }, { "epoch": 0.88, "learning_rate": 1.7163998506234432e-07, "loss": 1.1253, "step": 29375 }, { "epoch": 0.88, "learning_rate": 1.7155117496359148e-07, "loss": 1.0438, "step": 29376 }, { "epoch": 0.88, "learning_rate": 1.7146238703054957e-07, "loss": 1.0264, "step": 29377 }, { "epoch": 0.89, "learning_rate": 1.713736212640643e-07, "loss": 1.0981, "step": 29378 }, { "epoch": 0.89, "learning_rate": 1.712848776649806e-07, "loss": 1.0681, "step": 29379 }, { "epoch": 0.89, "learning_rate": 1.7119615623414326e-07, "loss": 1.1254, "step": 29380 }, { "epoch": 0.89, "learning_rate": 1.7110745697239722e-07, "loss": 1.0996, "step": 29381 }, { "epoch": 0.89, "learning_rate": 1.7101877988058625e-07, "loss": 1.1099, "step": 29382 }, { "epoch": 0.89, "learning_rate": 1.709301249595552e-07, "loss": 1.0795, "step": 29383 }, { "epoch": 0.89, "learning_rate": 1.7084149221014758e-07, "loss": 1.002, "step": 29384 }, { "epoch": 0.89, "learning_rate": 1.7075288163320685e-07, "loss": 1.0173, "step": 29385 }, { "epoch": 0.89, "learning_rate": 1.706642932295771e-07, "loss": 1.1194, "step": 29386 }, { "epoch": 0.89, "learning_rate": 1.7057572700010156e-07, "loss": 1.046, "step": 29387 }, { "epoch": 0.89, "learning_rate": 1.7048718294562312e-07, "loss": 1.0325, "step": 29388 }, { "epoch": 0.89, "learning_rate": 1.7039866106698443e-07, "loss": 1.1699, "step": 29389 }, { "epoch": 0.89, "learning_rate": 1.7031016136502877e-07, "loss": 1.0775, "step": 29390 }, { "epoch": 0.89, "learning_rate": 1.7022168384059871e-07, "loss": 1.1857, "step": 29391 }, { "epoch": 0.89, "learning_rate": 1.7013322849453588e-07, "loss": 1.1307, "step": 29392 }, { "epoch": 0.89, "learning_rate": 1.7004479532768235e-07, "loss": 1.1212, "step": 29393 }, { "epoch": 0.89, "learning_rate": 1.6995638434088053e-07, "loss": 1.0843, "step": 29394 }, { "epoch": 0.89, "learning_rate": 1.6986799553497135e-07, "loss": 1.119, "step": 29395 }, { "epoch": 0.89, "learning_rate": 1.6977962891079725e-07, "loss": 1.0804, "step": 29396 }, { "epoch": 0.89, "learning_rate": 1.6969128446919863e-07, "loss": 1.079, "step": 29397 }, { "epoch": 0.89, "learning_rate": 1.6960296221101624e-07, "loss": 1.1711, "step": 29398 }, { "epoch": 0.89, "learning_rate": 1.695146621370916e-07, "loss": 1.0856, "step": 29399 }, { "epoch": 0.89, "learning_rate": 1.6942638424826519e-07, "loss": 1.1283, "step": 29400 }, { "epoch": 0.89, "learning_rate": 1.6933812854537685e-07, "loss": 1.0732, "step": 29401 }, { "epoch": 0.89, "learning_rate": 1.6924989502926703e-07, "loss": 1.0597, "step": 29402 }, { "epoch": 0.89, "learning_rate": 1.6916168370077561e-07, "loss": 1.0728, "step": 29403 }, { "epoch": 0.89, "learning_rate": 1.6907349456074252e-07, "loss": 1.1397, "step": 29404 }, { "epoch": 0.89, "learning_rate": 1.6898532761000703e-07, "loss": 1.02, "step": 29405 }, { "epoch": 0.89, "learning_rate": 1.6889718284940875e-07, "loss": 1.0495, "step": 29406 }, { "epoch": 0.89, "learning_rate": 1.688090602797865e-07, "loss": 1.022, "step": 29407 }, { "epoch": 0.89, "learning_rate": 1.68720959901979e-07, "loss": 1.0682, "step": 29408 }, { "epoch": 0.89, "learning_rate": 1.686328817168259e-07, "loss": 1.0323, "step": 29409 }, { "epoch": 0.89, "learning_rate": 1.6854482572516455e-07, "loss": 1.0594, "step": 29410 }, { "epoch": 0.89, "learning_rate": 1.6845679192783348e-07, "loss": 1.1399, "step": 29411 }, { "epoch": 0.89, "learning_rate": 1.683687803256709e-07, "loss": 1.1609, "step": 29412 }, { "epoch": 0.89, "learning_rate": 1.6828079091951472e-07, "loss": 1.0703, "step": 29413 }, { "epoch": 0.89, "learning_rate": 1.6819282371020234e-07, "loss": 1.0939, "step": 29414 }, { "epoch": 0.89, "learning_rate": 1.6810487869857117e-07, "loss": 1.1929, "step": 29415 }, { "epoch": 0.89, "learning_rate": 1.680169558854583e-07, "loss": 1.195, "step": 29416 }, { "epoch": 0.89, "learning_rate": 1.679290552717014e-07, "loss": 1.0416, "step": 29417 }, { "epoch": 0.89, "learning_rate": 1.6784117685813644e-07, "loss": 1.0754, "step": 29418 }, { "epoch": 0.89, "learning_rate": 1.6775332064560002e-07, "loss": 1.0294, "step": 29419 }, { "epoch": 0.89, "learning_rate": 1.6766548663492894e-07, "loss": 0.9794, "step": 29420 }, { "epoch": 0.89, "learning_rate": 1.675776748269592e-07, "loss": 1.0228, "step": 29421 }, { "epoch": 0.89, "learning_rate": 1.6748988522252678e-07, "loss": 1.0781, "step": 29422 }, { "epoch": 0.89, "learning_rate": 1.6740211782246717e-07, "loss": 1.0674, "step": 29423 }, { "epoch": 0.89, "learning_rate": 1.673143726276158e-07, "loss": 1.2431, "step": 29424 }, { "epoch": 0.89, "learning_rate": 1.6722664963880836e-07, "loss": 1.0793, "step": 29425 }, { "epoch": 0.89, "learning_rate": 1.6713894885687975e-07, "loss": 1.0664, "step": 29426 }, { "epoch": 0.89, "learning_rate": 1.6705127028266488e-07, "loss": 1.093, "step": 29427 }, { "epoch": 0.89, "learning_rate": 1.6696361391699807e-07, "loss": 1.032, "step": 29428 }, { "epoch": 0.89, "learning_rate": 1.668759797607139e-07, "loss": 1.2001, "step": 29429 }, { "epoch": 0.89, "learning_rate": 1.6678836781464675e-07, "loss": 1.0862, "step": 29430 }, { "epoch": 0.89, "learning_rate": 1.667007780796309e-07, "loss": 1.0947, "step": 29431 }, { "epoch": 0.89, "learning_rate": 1.6661321055649965e-07, "loss": 1.1355, "step": 29432 }, { "epoch": 0.89, "learning_rate": 1.66525665246087e-07, "loss": 1.0634, "step": 29433 }, { "epoch": 0.89, "learning_rate": 1.6643814214922644e-07, "loss": 1.0685, "step": 29434 }, { "epoch": 0.89, "learning_rate": 1.6635064126675037e-07, "loss": 1.0842, "step": 29435 }, { "epoch": 0.89, "learning_rate": 1.662631625994926e-07, "loss": 1.0567, "step": 29436 }, { "epoch": 0.89, "learning_rate": 1.661757061482852e-07, "loss": 1.2234, "step": 29437 }, { "epoch": 0.89, "learning_rate": 1.6608827191396115e-07, "loss": 1.1136, "step": 29438 }, { "epoch": 0.89, "learning_rate": 1.6600085989735337e-07, "loss": 1.1106, "step": 29439 }, { "epoch": 0.89, "learning_rate": 1.6591347009929259e-07, "loss": 1.0439, "step": 29440 }, { "epoch": 0.89, "learning_rate": 1.6582610252061177e-07, "loss": 1.1139, "step": 29441 }, { "epoch": 0.89, "learning_rate": 1.6573875716214216e-07, "loss": 1.1509, "step": 29442 }, { "epoch": 0.89, "learning_rate": 1.6565143402471562e-07, "loss": 1.0595, "step": 29443 }, { "epoch": 0.89, "learning_rate": 1.6556413310916287e-07, "loss": 1.1562, "step": 29444 }, { "epoch": 0.89, "learning_rate": 1.6547685441631518e-07, "loss": 1.1152, "step": 29445 }, { "epoch": 0.89, "learning_rate": 1.6538959794700356e-07, "loss": 0.9971, "step": 29446 }, { "epoch": 0.89, "learning_rate": 1.65302363702059e-07, "loss": 1.0247, "step": 29447 }, { "epoch": 0.89, "learning_rate": 1.6521515168231112e-07, "loss": 1.1446, "step": 29448 }, { "epoch": 0.89, "learning_rate": 1.6512796188859038e-07, "loss": 1.1914, "step": 29449 }, { "epoch": 0.89, "learning_rate": 1.650407943217272e-07, "loss": 1.1746, "step": 29450 }, { "epoch": 0.89, "learning_rate": 1.6495364898255094e-07, "loss": 1.0148, "step": 29451 }, { "epoch": 0.89, "learning_rate": 1.648665258718915e-07, "loss": 1.105, "step": 29452 }, { "epoch": 0.89, "learning_rate": 1.647794249905782e-07, "loss": 1.1041, "step": 29453 }, { "epoch": 0.89, "learning_rate": 1.646923463394398e-07, "loss": 1.0419, "step": 29454 }, { "epoch": 0.89, "learning_rate": 1.646052899193054e-07, "loss": 1.119, "step": 29455 }, { "epoch": 0.89, "learning_rate": 1.6451825573100406e-07, "loss": 1.1732, "step": 29456 }, { "epoch": 0.89, "learning_rate": 1.6443124377536423e-07, "loss": 0.9999, "step": 29457 }, { "epoch": 0.89, "learning_rate": 1.6434425405321392e-07, "loss": 1.0786, "step": 29458 }, { "epoch": 0.89, "learning_rate": 1.6425728656538186e-07, "loss": 1.0071, "step": 29459 }, { "epoch": 0.89, "learning_rate": 1.6417034131269522e-07, "loss": 1.1666, "step": 29460 }, { "epoch": 0.89, "learning_rate": 1.640834182959819e-07, "loss": 1.0826, "step": 29461 }, { "epoch": 0.89, "learning_rate": 1.6399651751606933e-07, "loss": 1.1826, "step": 29462 }, { "epoch": 0.89, "learning_rate": 1.6390963897378486e-07, "loss": 1.0615, "step": 29463 }, { "epoch": 0.89, "learning_rate": 1.6382278266995565e-07, "loss": 1.0599, "step": 29464 }, { "epoch": 0.89, "learning_rate": 1.637359486054088e-07, "loss": 1.0938, "step": 29465 }, { "epoch": 0.89, "learning_rate": 1.6364913678097004e-07, "loss": 1.1234, "step": 29466 }, { "epoch": 0.89, "learning_rate": 1.6356234719746623e-07, "loss": 1.1036, "step": 29467 }, { "epoch": 0.89, "learning_rate": 1.6347557985572388e-07, "loss": 1.1993, "step": 29468 }, { "epoch": 0.89, "learning_rate": 1.6338883475656876e-07, "loss": 1.1069, "step": 29469 }, { "epoch": 0.89, "learning_rate": 1.6330211190082628e-07, "loss": 1.1016, "step": 29470 }, { "epoch": 0.89, "learning_rate": 1.632154112893225e-07, "loss": 1.0203, "step": 29471 }, { "epoch": 0.89, "learning_rate": 1.6312873292288227e-07, "loss": 1.1859, "step": 29472 }, { "epoch": 0.89, "learning_rate": 1.6304207680233163e-07, "loss": 0.9611, "step": 29473 }, { "epoch": 0.89, "learning_rate": 1.6295544292849436e-07, "loss": 1.1039, "step": 29474 }, { "epoch": 0.89, "learning_rate": 1.628688313021959e-07, "loss": 1.2121, "step": 29475 }, { "epoch": 0.89, "learning_rate": 1.6278224192426058e-07, "loss": 1.032, "step": 29476 }, { "epoch": 0.89, "learning_rate": 1.6269567479551246e-07, "loss": 1.1273, "step": 29477 }, { "epoch": 0.89, "learning_rate": 1.6260912991677646e-07, "loss": 0.9918, "step": 29478 }, { "epoch": 0.89, "learning_rate": 1.6252260728887525e-07, "loss": 1.1987, "step": 29479 }, { "epoch": 0.89, "learning_rate": 1.624361069126329e-07, "loss": 1.1129, "step": 29480 }, { "epoch": 0.89, "learning_rate": 1.6234962878887344e-07, "loss": 1.0923, "step": 29481 }, { "epoch": 0.89, "learning_rate": 1.6226317291841958e-07, "loss": 1.077, "step": 29482 }, { "epoch": 0.89, "learning_rate": 1.6217673930209426e-07, "loss": 1.0482, "step": 29483 }, { "epoch": 0.89, "learning_rate": 1.620903279407207e-07, "loss": 1.1111, "step": 29484 }, { "epoch": 0.89, "learning_rate": 1.6200393883512076e-07, "loss": 1.0628, "step": 29485 }, { "epoch": 0.89, "learning_rate": 1.6191757198611768e-07, "loss": 1.0087, "step": 29486 }, { "epoch": 0.89, "learning_rate": 1.61831227394533e-07, "loss": 0.9907, "step": 29487 }, { "epoch": 0.89, "learning_rate": 1.6174490506118913e-07, "loss": 1.2028, "step": 29488 }, { "epoch": 0.89, "learning_rate": 1.616586049869076e-07, "loss": 1.0403, "step": 29489 }, { "epoch": 0.89, "learning_rate": 1.6157232717250976e-07, "loss": 1.0931, "step": 29490 }, { "epoch": 0.89, "learning_rate": 1.614860716188177e-07, "loss": 1.062, "step": 29491 }, { "epoch": 0.89, "learning_rate": 1.6139983832665158e-07, "loss": 1.0219, "step": 29492 }, { "epoch": 0.89, "learning_rate": 1.613136272968327e-07, "loss": 1.1844, "step": 29493 }, { "epoch": 0.89, "learning_rate": 1.612274385301818e-07, "loss": 1.0696, "step": 29494 }, { "epoch": 0.89, "learning_rate": 1.611412720275196e-07, "loss": 1.0461, "step": 29495 }, { "epoch": 0.89, "learning_rate": 1.610551277896655e-07, "loss": 1.0773, "step": 29496 }, { "epoch": 0.89, "learning_rate": 1.609690058174404e-07, "loss": 1.0082, "step": 29497 }, { "epoch": 0.89, "learning_rate": 1.6088290611166375e-07, "loss": 1.14, "step": 29498 }, { "epoch": 0.89, "learning_rate": 1.6079682867315566e-07, "loss": 1.0401, "step": 29499 }, { "epoch": 0.89, "learning_rate": 1.6071077350273469e-07, "loss": 1.119, "step": 29500 }, { "epoch": 0.89, "learning_rate": 1.6062474060122042e-07, "loss": 0.9948, "step": 29501 }, { "epoch": 0.89, "learning_rate": 1.605387299694322e-07, "loss": 1.0681, "step": 29502 }, { "epoch": 0.89, "learning_rate": 1.604527416081883e-07, "loss": 1.0701, "step": 29503 }, { "epoch": 0.89, "learning_rate": 1.6036677551830804e-07, "loss": 1.0776, "step": 29504 }, { "epoch": 0.89, "learning_rate": 1.602808317006091e-07, "loss": 1.0776, "step": 29505 }, { "epoch": 0.89, "learning_rate": 1.6019491015590944e-07, "loss": 1.2014, "step": 29506 }, { "epoch": 0.89, "learning_rate": 1.6010901088502757e-07, "loss": 1.1585, "step": 29507 }, { "epoch": 0.89, "learning_rate": 1.6002313388878144e-07, "loss": 1.0602, "step": 29508 }, { "epoch": 0.89, "learning_rate": 1.5993727916798735e-07, "loss": 1.153, "step": 29509 }, { "epoch": 0.89, "learning_rate": 1.598514467234638e-07, "loss": 1.0803, "step": 29510 }, { "epoch": 0.89, "learning_rate": 1.597656365560271e-07, "loss": 1.0865, "step": 29511 }, { "epoch": 0.89, "learning_rate": 1.5967984866649467e-07, "loss": 1.0022, "step": 29512 }, { "epoch": 0.89, "learning_rate": 1.5959408305568276e-07, "loss": 1.1149, "step": 29513 }, { "epoch": 0.89, "learning_rate": 1.5950833972440792e-07, "loss": 1.0732, "step": 29514 }, { "epoch": 0.89, "learning_rate": 1.594226186734868e-07, "loss": 1.0447, "step": 29515 }, { "epoch": 0.89, "learning_rate": 1.5933691990373478e-07, "loss": 1.0088, "step": 29516 }, { "epoch": 0.89, "learning_rate": 1.592512434159685e-07, "loss": 1.0949, "step": 29517 }, { "epoch": 0.89, "learning_rate": 1.591655892110025e-07, "loss": 1.1547, "step": 29518 }, { "epoch": 0.89, "learning_rate": 1.5907995728965286e-07, "loss": 1.1302, "step": 29519 }, { "epoch": 0.89, "learning_rate": 1.5899434765273475e-07, "loss": 1.0654, "step": 29520 }, { "epoch": 0.89, "learning_rate": 1.5890876030106305e-07, "loss": 1.096, "step": 29521 }, { "epoch": 0.89, "learning_rate": 1.5882319523545243e-07, "loss": 1.0054, "step": 29522 }, { "epoch": 0.89, "learning_rate": 1.5873765245671718e-07, "loss": 1.0101, "step": 29523 }, { "epoch": 0.89, "learning_rate": 1.5865213196567196e-07, "loss": 1.131, "step": 29524 }, { "epoch": 0.89, "learning_rate": 1.5856663376313114e-07, "loss": 1.0253, "step": 29525 }, { "epoch": 0.89, "learning_rate": 1.5848115784990792e-07, "loss": 1.0265, "step": 29526 }, { "epoch": 0.89, "learning_rate": 1.583957042268164e-07, "loss": 1.1505, "step": 29527 }, { "epoch": 0.89, "learning_rate": 1.5831027289467005e-07, "loss": 1.059, "step": 29528 }, { "epoch": 0.89, "learning_rate": 1.5822486385428186e-07, "loss": 1.0267, "step": 29529 }, { "epoch": 0.89, "learning_rate": 1.5813947710646592e-07, "loss": 1.2579, "step": 29530 }, { "epoch": 0.89, "learning_rate": 1.5805411265203352e-07, "loss": 1.1555, "step": 29531 }, { "epoch": 0.89, "learning_rate": 1.5796877049179814e-07, "loss": 1.0853, "step": 29532 }, { "epoch": 0.89, "learning_rate": 1.5788345062657224e-07, "loss": 1.1752, "step": 29533 }, { "epoch": 0.89, "learning_rate": 1.5779815305716818e-07, "loss": 1.1758, "step": 29534 }, { "epoch": 0.89, "learning_rate": 1.5771287778439754e-07, "loss": 1.1115, "step": 29535 }, { "epoch": 0.89, "learning_rate": 1.576276248090719e-07, "loss": 1.0703, "step": 29536 }, { "epoch": 0.89, "learning_rate": 1.5754239413200312e-07, "loss": 0.9792, "step": 29537 }, { "epoch": 0.89, "learning_rate": 1.5745718575400275e-07, "loss": 1.0151, "step": 29538 }, { "epoch": 0.89, "learning_rate": 1.5737199967588185e-07, "loss": 1.1862, "step": 29539 }, { "epoch": 0.89, "learning_rate": 1.572868358984511e-07, "loss": 1.0569, "step": 29540 }, { "epoch": 0.89, "learning_rate": 1.572016944225216e-07, "loss": 1.0616, "step": 29541 }, { "epoch": 0.89, "learning_rate": 1.5711657524890345e-07, "loss": 1.1229, "step": 29542 }, { "epoch": 0.89, "learning_rate": 1.5703147837840716e-07, "loss": 1.0898, "step": 29543 }, { "epoch": 0.89, "learning_rate": 1.569464038118429e-07, "loss": 0.9849, "step": 29544 }, { "epoch": 0.89, "learning_rate": 1.5686135155002002e-07, "loss": 0.9971, "step": 29545 }, { "epoch": 0.89, "learning_rate": 1.56776321593749e-07, "loss": 1.0549, "step": 29546 }, { "epoch": 0.89, "learning_rate": 1.5669131394383919e-07, "loss": 1.0953, "step": 29547 }, { "epoch": 0.89, "learning_rate": 1.566063286010988e-07, "loss": 1.0482, "step": 29548 }, { "epoch": 0.89, "learning_rate": 1.565213655663378e-07, "loss": 1.1747, "step": 29549 }, { "epoch": 0.89, "learning_rate": 1.5643642484036464e-07, "loss": 1.0518, "step": 29550 }, { "epoch": 0.89, "learning_rate": 1.5635150642398843e-07, "loss": 1.132, "step": 29551 }, { "epoch": 0.89, "learning_rate": 1.5626661031801687e-07, "loss": 1.0709, "step": 29552 }, { "epoch": 0.89, "learning_rate": 1.561817365232582e-07, "loss": 1.1202, "step": 29553 }, { "epoch": 0.89, "learning_rate": 1.5609688504052063e-07, "loss": 1.0498, "step": 29554 }, { "epoch": 0.89, "learning_rate": 1.5601205587061214e-07, "loss": 1.1308, "step": 29555 }, { "epoch": 0.89, "learning_rate": 1.5592724901433986e-07, "loss": 1.0051, "step": 29556 }, { "epoch": 0.89, "learning_rate": 1.5584246447251123e-07, "loss": 1.1389, "step": 29557 }, { "epoch": 0.89, "learning_rate": 1.5575770224593333e-07, "loss": 1.0765, "step": 29558 }, { "epoch": 0.89, "learning_rate": 1.5567296233541278e-07, "loss": 1.1198, "step": 29559 }, { "epoch": 0.89, "learning_rate": 1.5558824474175728e-07, "loss": 1.2238, "step": 29560 }, { "epoch": 0.89, "learning_rate": 1.5550354946577195e-07, "loss": 1.2026, "step": 29561 }, { "epoch": 0.89, "learning_rate": 1.554188765082637e-07, "loss": 1.2179, "step": 29562 }, { "epoch": 0.89, "learning_rate": 1.5533422587003881e-07, "loss": 1.0799, "step": 29563 }, { "epoch": 0.89, "learning_rate": 1.5524959755190304e-07, "loss": 1.063, "step": 29564 }, { "epoch": 0.89, "learning_rate": 1.5516499155466157e-07, "loss": 1.0664, "step": 29565 }, { "epoch": 0.89, "learning_rate": 1.5508040787911988e-07, "loss": 1.0447, "step": 29566 }, { "epoch": 0.89, "learning_rate": 1.549958465260834e-07, "loss": 1.1671, "step": 29567 }, { "epoch": 0.89, "learning_rate": 1.5491130749635734e-07, "loss": 1.1848, "step": 29568 }, { "epoch": 0.89, "learning_rate": 1.548267907907458e-07, "loss": 1.0488, "step": 29569 }, { "epoch": 0.89, "learning_rate": 1.5474229641005396e-07, "loss": 1.1014, "step": 29570 }, { "epoch": 0.89, "learning_rate": 1.5465782435508585e-07, "loss": 1.1826, "step": 29571 }, { "epoch": 0.89, "learning_rate": 1.545733746266459e-07, "loss": 1.0963, "step": 29572 }, { "epoch": 0.89, "learning_rate": 1.5448894722553787e-07, "loss": 1.1854, "step": 29573 }, { "epoch": 0.89, "learning_rate": 1.544045421525653e-07, "loss": 1.0502, "step": 29574 }, { "epoch": 0.89, "learning_rate": 1.5432015940853168e-07, "loss": 1.176, "step": 29575 }, { "epoch": 0.89, "learning_rate": 1.5423579899424056e-07, "loss": 1.0921, "step": 29576 }, { "epoch": 0.89, "learning_rate": 1.541514609104952e-07, "loss": 1.1614, "step": 29577 }, { "epoch": 0.89, "learning_rate": 1.5406714515809774e-07, "loss": 1.1478, "step": 29578 }, { "epoch": 0.89, "learning_rate": 1.5398285173785138e-07, "loss": 1.1748, "step": 29579 }, { "epoch": 0.89, "learning_rate": 1.5389858065055802e-07, "loss": 1.1031, "step": 29580 }, { "epoch": 0.89, "learning_rate": 1.538143318970206e-07, "loss": 1.0403, "step": 29581 }, { "epoch": 0.89, "learning_rate": 1.5373010547804101e-07, "loss": 1.0743, "step": 29582 }, { "epoch": 0.89, "learning_rate": 1.5364590139442053e-07, "loss": 1.0674, "step": 29583 }, { "epoch": 0.89, "learning_rate": 1.5356171964696077e-07, "loss": 1.0198, "step": 29584 }, { "epoch": 0.89, "learning_rate": 1.5347756023646355e-07, "loss": 1.1057, "step": 29585 }, { "epoch": 0.89, "learning_rate": 1.5339342316373017e-07, "loss": 1.1755, "step": 29586 }, { "epoch": 0.89, "learning_rate": 1.5330930842956087e-07, "loss": 1.0926, "step": 29587 }, { "epoch": 0.89, "learning_rate": 1.5322521603475692e-07, "loss": 1.159, "step": 29588 }, { "epoch": 0.89, "learning_rate": 1.5314114598011827e-07, "loss": 1.0824, "step": 29589 }, { "epoch": 0.89, "learning_rate": 1.5305709826644645e-07, "loss": 1.1464, "step": 29590 }, { "epoch": 0.89, "learning_rate": 1.5297307289454e-07, "loss": 1.0613, "step": 29591 }, { "epoch": 0.89, "learning_rate": 1.5288906986519969e-07, "loss": 1.1799, "step": 29592 }, { "epoch": 0.89, "learning_rate": 1.5280508917922487e-07, "loss": 1.1153, "step": 29593 }, { "epoch": 0.89, "learning_rate": 1.5272113083741547e-07, "loss": 1.1601, "step": 29594 }, { "epoch": 0.89, "learning_rate": 1.5263719484057028e-07, "loss": 1.1185, "step": 29595 }, { "epoch": 0.89, "learning_rate": 1.5255328118948835e-07, "loss": 1.1501, "step": 29596 }, { "epoch": 0.89, "learning_rate": 1.5246938988496856e-07, "loss": 0.982, "step": 29597 }, { "epoch": 0.89, "learning_rate": 1.5238552092780967e-07, "loss": 1.1011, "step": 29598 }, { "epoch": 0.89, "learning_rate": 1.523016743188105e-07, "loss": 1.1838, "step": 29599 }, { "epoch": 0.89, "learning_rate": 1.5221785005876816e-07, "loss": 1.2737, "step": 29600 }, { "epoch": 0.89, "learning_rate": 1.5213404814848122e-07, "loss": 1.0515, "step": 29601 }, { "epoch": 0.89, "learning_rate": 1.5205026858874733e-07, "loss": 1.0649, "step": 29602 }, { "epoch": 0.89, "learning_rate": 1.519665113803645e-07, "loss": 1.011, "step": 29603 }, { "epoch": 0.89, "learning_rate": 1.5188277652412902e-07, "loss": 1.0591, "step": 29604 }, { "epoch": 0.89, "learning_rate": 1.5179906402083888e-07, "loss": 1.0167, "step": 29605 }, { "epoch": 0.89, "learning_rate": 1.5171537387129066e-07, "loss": 1.1201, "step": 29606 }, { "epoch": 0.89, "learning_rate": 1.516317060762812e-07, "loss": 1.032, "step": 29607 }, { "epoch": 0.89, "learning_rate": 1.515480606366071e-07, "loss": 1.1465, "step": 29608 }, { "epoch": 0.89, "learning_rate": 1.514644375530641e-07, "loss": 1.0742, "step": 29609 }, { "epoch": 0.89, "learning_rate": 1.5138083682644855e-07, "loss": 1.1035, "step": 29610 }, { "epoch": 0.89, "learning_rate": 1.5129725845755615e-07, "loss": 0.9865, "step": 29611 }, { "epoch": 0.89, "learning_rate": 1.5121370244718326e-07, "loss": 1.0919, "step": 29612 }, { "epoch": 0.89, "learning_rate": 1.5113016879612418e-07, "loss": 1.0829, "step": 29613 }, { "epoch": 0.89, "learning_rate": 1.5104665750517473e-07, "loss": 1.1532, "step": 29614 }, { "epoch": 0.89, "learning_rate": 1.5096316857512976e-07, "loss": 0.9819, "step": 29615 }, { "epoch": 0.89, "learning_rate": 1.5087970200678454e-07, "loss": 1.0784, "step": 29616 }, { "epoch": 0.89, "learning_rate": 1.507962578009328e-07, "loss": 1.0921, "step": 29617 }, { "epoch": 0.89, "learning_rate": 1.5071283595836928e-07, "loss": 1.0733, "step": 29618 }, { "epoch": 0.89, "learning_rate": 1.5062943647988798e-07, "loss": 1.1542, "step": 29619 }, { "epoch": 0.89, "learning_rate": 1.5054605936628302e-07, "loss": 1.0601, "step": 29620 }, { "epoch": 0.89, "learning_rate": 1.504627046183482e-07, "loss": 1.0419, "step": 29621 }, { "epoch": 0.89, "learning_rate": 1.503793722368768e-07, "loss": 1.1261, "step": 29622 }, { "epoch": 0.89, "learning_rate": 1.5029606222266235e-07, "loss": 1.2554, "step": 29623 }, { "epoch": 0.89, "learning_rate": 1.5021277457649753e-07, "loss": 1.0732, "step": 29624 }, { "epoch": 0.89, "learning_rate": 1.501295092991753e-07, "loss": 0.9878, "step": 29625 }, { "epoch": 0.89, "learning_rate": 1.500462663914884e-07, "loss": 1.1647, "step": 29626 }, { "epoch": 0.89, "learning_rate": 1.4996304585422922e-07, "loss": 1.1046, "step": 29627 }, { "epoch": 0.89, "learning_rate": 1.498798476881902e-07, "loss": 1.1288, "step": 29628 }, { "epoch": 0.89, "learning_rate": 1.4979667189416347e-07, "loss": 1.1802, "step": 29629 }, { "epoch": 0.89, "learning_rate": 1.497135184729401e-07, "loss": 1.1669, "step": 29630 }, { "epoch": 0.89, "learning_rate": 1.4963038742531216e-07, "loss": 1.2527, "step": 29631 }, { "epoch": 0.89, "learning_rate": 1.4954727875207075e-07, "loss": 1.1085, "step": 29632 }, { "epoch": 0.89, "learning_rate": 1.49464192454008e-07, "loss": 1.0278, "step": 29633 }, { "epoch": 0.89, "learning_rate": 1.4938112853191329e-07, "loss": 1.0661, "step": 29634 }, { "epoch": 0.89, "learning_rate": 1.4929808698657843e-07, "loss": 1.0762, "step": 29635 }, { "epoch": 0.89, "learning_rate": 1.492150678187937e-07, "loss": 1.2071, "step": 29636 }, { "epoch": 0.89, "learning_rate": 1.4913207102934896e-07, "loss": 1.1572, "step": 29637 }, { "epoch": 0.89, "learning_rate": 1.4904909661903556e-07, "loss": 1.0294, "step": 29638 }, { "epoch": 0.89, "learning_rate": 1.4896614458864171e-07, "loss": 1.0086, "step": 29639 }, { "epoch": 0.89, "learning_rate": 1.4888321493895797e-07, "loss": 1.0358, "step": 29640 }, { "epoch": 0.89, "learning_rate": 1.4880030767077393e-07, "loss": 1.0142, "step": 29641 }, { "epoch": 0.89, "learning_rate": 1.4871742278487867e-07, "loss": 1.1069, "step": 29642 }, { "epoch": 0.89, "learning_rate": 1.4863456028206075e-07, "loss": 1.1731, "step": 29643 }, { "epoch": 0.89, "learning_rate": 1.4855172016310954e-07, "loss": 1.0641, "step": 29644 }, { "epoch": 0.89, "learning_rate": 1.4846890242881328e-07, "loss": 1.0618, "step": 29645 }, { "epoch": 0.89, "learning_rate": 1.4838610707996108e-07, "loss": 1.0582, "step": 29646 }, { "epoch": 0.89, "learning_rate": 1.483033341173401e-07, "loss": 1.0482, "step": 29647 }, { "epoch": 0.89, "learning_rate": 1.4822058354173886e-07, "loss": 1.2147, "step": 29648 }, { "epoch": 0.89, "learning_rate": 1.4813785535394503e-07, "loss": 1.126, "step": 29649 }, { "epoch": 0.89, "learning_rate": 1.480551495547461e-07, "loss": 1.2238, "step": 29650 }, { "epoch": 0.89, "learning_rate": 1.4797246614492916e-07, "loss": 1.0425, "step": 29651 }, { "epoch": 0.89, "learning_rate": 1.4788980512528167e-07, "loss": 1.0811, "step": 29652 }, { "epoch": 0.89, "learning_rate": 1.478071664965905e-07, "loss": 1.1448, "step": 29653 }, { "epoch": 0.89, "learning_rate": 1.4772455025964222e-07, "loss": 1.0969, "step": 29654 }, { "epoch": 0.89, "learning_rate": 1.4764195641522372e-07, "loss": 1.0385, "step": 29655 }, { "epoch": 0.89, "learning_rate": 1.4755938496412077e-07, "loss": 1.2067, "step": 29656 }, { "epoch": 0.89, "learning_rate": 1.4747683590711908e-07, "loss": 1.0688, "step": 29657 }, { "epoch": 0.89, "learning_rate": 1.4739430924500503e-07, "loss": 1.028, "step": 29658 }, { "epoch": 0.89, "learning_rate": 1.473118049785646e-07, "loss": 1.1516, "step": 29659 }, { "epoch": 0.89, "learning_rate": 1.4722932310858196e-07, "loss": 1.0805, "step": 29660 }, { "epoch": 0.89, "learning_rate": 1.4714686363584335e-07, "loss": 1.0433, "step": 29661 }, { "epoch": 0.89, "learning_rate": 1.4706442656113345e-07, "loss": 1.1609, "step": 29662 }, { "epoch": 0.89, "learning_rate": 1.469820118852369e-07, "loss": 1.0757, "step": 29663 }, { "epoch": 0.89, "learning_rate": 1.4689961960893868e-07, "loss": 1.1242, "step": 29664 }, { "epoch": 0.89, "learning_rate": 1.4681724973302254e-07, "loss": 1.0543, "step": 29665 }, { "epoch": 0.89, "learning_rate": 1.4673490225827259e-07, "loss": 1.0941, "step": 29666 }, { "epoch": 0.89, "learning_rate": 1.466525771854732e-07, "loss": 1.1394, "step": 29667 }, { "epoch": 0.89, "learning_rate": 1.4657027451540823e-07, "loss": 1.1852, "step": 29668 }, { "epoch": 0.89, "learning_rate": 1.4648799424886033e-07, "loss": 1.1616, "step": 29669 }, { "epoch": 0.89, "learning_rate": 1.4640573638661338e-07, "loss": 1.0606, "step": 29670 }, { "epoch": 0.89, "learning_rate": 1.463235009294503e-07, "loss": 1.0982, "step": 29671 }, { "epoch": 0.89, "learning_rate": 1.462412878781541e-07, "loss": 1.129, "step": 29672 }, { "epoch": 0.89, "learning_rate": 1.4615909723350696e-07, "loss": 0.9667, "step": 29673 }, { "epoch": 0.89, "learning_rate": 1.4607692899629156e-07, "loss": 0.9905, "step": 29674 }, { "epoch": 0.89, "learning_rate": 1.4599478316729032e-07, "loss": 1.1279, "step": 29675 }, { "epoch": 0.89, "learning_rate": 1.4591265974728457e-07, "loss": 1.0248, "step": 29676 }, { "epoch": 0.89, "learning_rate": 1.4583055873705704e-07, "loss": 1.1455, "step": 29677 }, { "epoch": 0.89, "learning_rate": 1.4574848013738846e-07, "loss": 1.1334, "step": 29678 }, { "epoch": 0.89, "learning_rate": 1.4566642394906045e-07, "loss": 1.0834, "step": 29679 }, { "epoch": 0.89, "learning_rate": 1.455843901728543e-07, "loss": 1.1429, "step": 29680 }, { "epoch": 0.89, "learning_rate": 1.4550237880955137e-07, "loss": 1.0975, "step": 29681 }, { "epoch": 0.89, "learning_rate": 1.454203898599313e-07, "loss": 1.2098, "step": 29682 }, { "epoch": 0.89, "learning_rate": 1.453384233247751e-07, "loss": 1.0815, "step": 29683 }, { "epoch": 0.89, "learning_rate": 1.4525647920486302e-07, "loss": 1.1143, "step": 29684 }, { "epoch": 0.89, "learning_rate": 1.4517455750097553e-07, "loss": 0.9445, "step": 29685 }, { "epoch": 0.89, "learning_rate": 1.45092658213892e-07, "loss": 1.0585, "step": 29686 }, { "epoch": 0.89, "learning_rate": 1.4501078134439184e-07, "loss": 1.0782, "step": 29687 }, { "epoch": 0.89, "learning_rate": 1.4492892689325523e-07, "loss": 1.1323, "step": 29688 }, { "epoch": 0.89, "learning_rate": 1.448470948612607e-07, "loss": 1.0944, "step": 29689 }, { "epoch": 0.89, "learning_rate": 1.4476528524918792e-07, "loss": 1.1609, "step": 29690 }, { "epoch": 0.89, "learning_rate": 1.4468349805781517e-07, "loss": 1.1589, "step": 29691 }, { "epoch": 0.89, "learning_rate": 1.4460173328792098e-07, "loss": 1.0898, "step": 29692 }, { "epoch": 0.89, "learning_rate": 1.445199909402839e-07, "loss": 1.0137, "step": 29693 }, { "epoch": 0.89, "learning_rate": 1.444382710156825e-07, "loss": 1.2548, "step": 29694 }, { "epoch": 0.89, "learning_rate": 1.4435657351489385e-07, "loss": 1.1932, "step": 29695 }, { "epoch": 0.89, "learning_rate": 1.442748984386963e-07, "loss": 1.1192, "step": 29696 }, { "epoch": 0.89, "learning_rate": 1.4419324578786697e-07, "loss": 1.1293, "step": 29697 }, { "epoch": 0.89, "learning_rate": 1.441116155631836e-07, "loss": 1.0609, "step": 29698 }, { "epoch": 0.89, "learning_rate": 1.4403000776542275e-07, "loss": 1.0322, "step": 29699 }, { "epoch": 0.89, "learning_rate": 1.439484223953616e-07, "loss": 1.1065, "step": 29700 }, { "epoch": 0.89, "learning_rate": 1.4386685945377677e-07, "loss": 1.0167, "step": 29701 }, { "epoch": 0.89, "learning_rate": 1.4378531894144483e-07, "loss": 1.0569, "step": 29702 }, { "epoch": 0.89, "learning_rate": 1.4370380085914154e-07, "loss": 1.0377, "step": 29703 }, { "epoch": 0.89, "learning_rate": 1.4362230520764352e-07, "loss": 1.017, "step": 29704 }, { "epoch": 0.89, "learning_rate": 1.4354083198772602e-07, "loss": 1.1459, "step": 29705 }, { "epoch": 0.89, "learning_rate": 1.4345938120016555e-07, "loss": 1.1125, "step": 29706 }, { "epoch": 0.89, "learning_rate": 1.433779528457363e-07, "loss": 1.1777, "step": 29707 }, { "epoch": 0.89, "learning_rate": 1.4329654692521373e-07, "loss": 1.0418, "step": 29708 }, { "epoch": 0.89, "learning_rate": 1.432151634393733e-07, "loss": 0.9675, "step": 29709 }, { "epoch": 0.9, "learning_rate": 1.4313380238898944e-07, "loss": 1.0536, "step": 29710 }, { "epoch": 0.9, "learning_rate": 1.4305246377483706e-07, "loss": 1.113, "step": 29711 }, { "epoch": 0.9, "learning_rate": 1.4297114759768942e-07, "loss": 1.0818, "step": 29712 }, { "epoch": 0.9, "learning_rate": 1.428898538583215e-07, "loss": 1.1966, "step": 29713 }, { "epoch": 0.9, "learning_rate": 1.4280858255750706e-07, "loss": 1.1572, "step": 29714 }, { "epoch": 0.9, "learning_rate": 1.4272733369601944e-07, "loss": 1.0087, "step": 29715 }, { "epoch": 0.9, "learning_rate": 1.4264610727463268e-07, "loss": 1.1289, "step": 29716 }, { "epoch": 0.9, "learning_rate": 1.4256490329411954e-07, "loss": 1.0806, "step": 29717 }, { "epoch": 0.9, "learning_rate": 1.424837217552527e-07, "loss": 1.2351, "step": 29718 }, { "epoch": 0.9, "learning_rate": 1.4240256265880574e-07, "loss": 0.9594, "step": 29719 }, { "epoch": 0.9, "learning_rate": 1.423214260055511e-07, "loss": 1.0595, "step": 29720 }, { "epoch": 0.9, "learning_rate": 1.4224031179626092e-07, "loss": 0.98, "step": 29721 }, { "epoch": 0.9, "learning_rate": 1.4215922003170706e-07, "loss": 1.0563, "step": 29722 }, { "epoch": 0.9, "learning_rate": 1.4207815071266202e-07, "loss": 1.0415, "step": 29723 }, { "epoch": 0.9, "learning_rate": 1.4199710383989789e-07, "loss": 1.2224, "step": 29724 }, { "epoch": 0.9, "learning_rate": 1.4191607941418522e-07, "loss": 1.1351, "step": 29725 }, { "epoch": 0.9, "learning_rate": 1.418350774362956e-07, "loss": 1.014, "step": 29726 }, { "epoch": 0.9, "learning_rate": 1.4175409790700033e-07, "loss": 1.1104, "step": 29727 }, { "epoch": 0.9, "learning_rate": 1.416731408270705e-07, "loss": 1.061, "step": 29728 }, { "epoch": 0.9, "learning_rate": 1.4159220619727688e-07, "loss": 1.1669, "step": 29729 }, { "epoch": 0.9, "learning_rate": 1.415112940183891e-07, "loss": 1.1469, "step": 29730 }, { "epoch": 0.9, "learning_rate": 1.4143040429117792e-07, "loss": 0.9668, "step": 29731 }, { "epoch": 0.9, "learning_rate": 1.4134953701641364e-07, "loss": 1.1179, "step": 29732 }, { "epoch": 0.9, "learning_rate": 1.4126869219486555e-07, "loss": 1.2216, "step": 29733 }, { "epoch": 0.9, "learning_rate": 1.4118786982730336e-07, "loss": 1.0703, "step": 29734 }, { "epoch": 0.9, "learning_rate": 1.41107069914497e-07, "loss": 1.0509, "step": 29735 }, { "epoch": 0.9, "learning_rate": 1.4102629245721505e-07, "loss": 1.0854, "step": 29736 }, { "epoch": 0.9, "learning_rate": 1.4094553745622686e-07, "loss": 1.0212, "step": 29737 }, { "epoch": 0.9, "learning_rate": 1.4086480491230098e-07, "loss": 1.0967, "step": 29738 }, { "epoch": 0.9, "learning_rate": 1.407840948262057e-07, "loss": 1.2054, "step": 29739 }, { "epoch": 0.9, "learning_rate": 1.4070340719870983e-07, "loss": 1.0687, "step": 29740 }, { "epoch": 0.9, "learning_rate": 1.4062274203058085e-07, "loss": 1.0768, "step": 29741 }, { "epoch": 0.9, "learning_rate": 1.4054209932258784e-07, "loss": 1.1041, "step": 29742 }, { "epoch": 0.9, "learning_rate": 1.4046147907549713e-07, "loss": 1.2211, "step": 29743 }, { "epoch": 0.9, "learning_rate": 1.403808812900767e-07, "loss": 1.1409, "step": 29744 }, { "epoch": 0.9, "learning_rate": 1.4030030596709404e-07, "loss": 1.0749, "step": 29745 }, { "epoch": 0.9, "learning_rate": 1.402197531073163e-07, "loss": 1.0999, "step": 29746 }, { "epoch": 0.9, "learning_rate": 1.4013922271150947e-07, "loss": 1.2283, "step": 29747 }, { "epoch": 0.9, "learning_rate": 1.400587147804408e-07, "loss": 1.1044, "step": 29748 }, { "epoch": 0.9, "learning_rate": 1.3997822931487658e-07, "loss": 1.1366, "step": 29749 }, { "epoch": 0.9, "learning_rate": 1.3989776631558343e-07, "loss": 1.0577, "step": 29750 }, { "epoch": 0.9, "learning_rate": 1.398173257833263e-07, "loss": 1.0866, "step": 29751 }, { "epoch": 0.9, "learning_rate": 1.3973690771887176e-07, "loss": 1.0716, "step": 29752 }, { "epoch": 0.9, "learning_rate": 1.3965651212298508e-07, "loss": 1.1721, "step": 29753 }, { "epoch": 0.9, "learning_rate": 1.3957613899643146e-07, "loss": 1.1748, "step": 29754 }, { "epoch": 0.9, "learning_rate": 1.3949578833997668e-07, "loss": 1.0991, "step": 29755 }, { "epoch": 0.9, "learning_rate": 1.3941546015438484e-07, "loss": 1.1357, "step": 29756 }, { "epoch": 0.9, "learning_rate": 1.393351544404206e-07, "loss": 1.1342, "step": 29757 }, { "epoch": 0.9, "learning_rate": 1.3925487119884924e-07, "loss": 1.0144, "step": 29758 }, { "epoch": 0.9, "learning_rate": 1.3917461043043423e-07, "loss": 1.0049, "step": 29759 }, { "epoch": 0.9, "learning_rate": 1.3909437213594001e-07, "loss": 0.9422, "step": 29760 }, { "epoch": 0.9, "learning_rate": 1.3901415631613013e-07, "loss": 1.1197, "step": 29761 }, { "epoch": 0.9, "learning_rate": 1.389339629717684e-07, "loss": 1.0957, "step": 29762 }, { "epoch": 0.9, "learning_rate": 1.38853792103619e-07, "loss": 1.0463, "step": 29763 }, { "epoch": 0.9, "learning_rate": 1.3877364371244346e-07, "loss": 1.1302, "step": 29764 }, { "epoch": 0.9, "learning_rate": 1.3869351779900592e-07, "loss": 0.9821, "step": 29765 }, { "epoch": 0.9, "learning_rate": 1.3861341436406883e-07, "loss": 1.101, "step": 29766 }, { "epoch": 0.9, "learning_rate": 1.3853333340839464e-07, "loss": 1.0559, "step": 29767 }, { "epoch": 0.9, "learning_rate": 1.3845327493274608e-07, "loss": 1.1405, "step": 29768 }, { "epoch": 0.9, "learning_rate": 1.3837323893788473e-07, "loss": 1.1525, "step": 29769 }, { "epoch": 0.9, "learning_rate": 1.382932254245728e-07, "loss": 1.1342, "step": 29770 }, { "epoch": 0.9, "learning_rate": 1.3821323439357187e-07, "loss": 1.2176, "step": 29771 }, { "epoch": 0.9, "learning_rate": 1.3813326584564386e-07, "loss": 1.2067, "step": 29772 }, { "epoch": 0.9, "learning_rate": 1.380533197815495e-07, "loss": 1.2432, "step": 29773 }, { "epoch": 0.9, "learning_rate": 1.3797339620204965e-07, "loss": 1.0829, "step": 29774 }, { "epoch": 0.9, "learning_rate": 1.3789349510790556e-07, "loss": 1.1205, "step": 29775 }, { "epoch": 0.9, "learning_rate": 1.3781361649987806e-07, "loss": 1.1352, "step": 29776 }, { "epoch": 0.9, "learning_rate": 1.377337603787271e-07, "loss": 1.0632, "step": 29777 }, { "epoch": 0.9, "learning_rate": 1.3765392674521288e-07, "loss": 1.0717, "step": 29778 }, { "epoch": 0.9, "learning_rate": 1.3757411560009564e-07, "loss": 1.1218, "step": 29779 }, { "epoch": 0.9, "learning_rate": 1.3749432694413505e-07, "loss": 1.1862, "step": 29780 }, { "epoch": 0.9, "learning_rate": 1.374145607780908e-07, "loss": 1.0632, "step": 29781 }, { "epoch": 0.9, "learning_rate": 1.3733481710272194e-07, "loss": 1.0757, "step": 29782 }, { "epoch": 0.9, "learning_rate": 1.3725509591878767e-07, "loss": 1.0571, "step": 29783 }, { "epoch": 0.9, "learning_rate": 1.3717539722704675e-07, "loss": 1.1166, "step": 29784 }, { "epoch": 0.9, "learning_rate": 1.3709572102825836e-07, "loss": 1.0111, "step": 29785 }, { "epoch": 0.9, "learning_rate": 1.3701606732318046e-07, "loss": 1.0779, "step": 29786 }, { "epoch": 0.9, "learning_rate": 1.369364361125719e-07, "loss": 1.0186, "step": 29787 }, { "epoch": 0.9, "learning_rate": 1.3685682739719043e-07, "loss": 1.0568, "step": 29788 }, { "epoch": 0.9, "learning_rate": 1.3677724117779344e-07, "loss": 1.0942, "step": 29789 }, { "epoch": 0.9, "learning_rate": 1.36697677455139e-07, "loss": 1.1774, "step": 29790 }, { "epoch": 0.9, "learning_rate": 1.3661813622998454e-07, "loss": 1.0518, "step": 29791 }, { "epoch": 0.9, "learning_rate": 1.3653861750308721e-07, "loss": 1.0717, "step": 29792 }, { "epoch": 0.9, "learning_rate": 1.3645912127520421e-07, "loss": 1.204, "step": 29793 }, { "epoch": 0.9, "learning_rate": 1.3637964754709188e-07, "loss": 1.0245, "step": 29794 }, { "epoch": 0.9, "learning_rate": 1.363001963195068e-07, "loss": 1.1149, "step": 29795 }, { "epoch": 0.9, "learning_rate": 1.3622076759320535e-07, "loss": 1.0565, "step": 29796 }, { "epoch": 0.9, "learning_rate": 1.3614136136894385e-07, "loss": 1.0038, "step": 29797 }, { "epoch": 0.9, "learning_rate": 1.3606197764747864e-07, "loss": 1.1523, "step": 29798 }, { "epoch": 0.9, "learning_rate": 1.3598261642956439e-07, "loss": 1.1594, "step": 29799 }, { "epoch": 0.9, "learning_rate": 1.359032777159569e-07, "loss": 1.0269, "step": 29800 }, { "epoch": 0.9, "learning_rate": 1.3582396150741194e-07, "loss": 1.0193, "step": 29801 }, { "epoch": 0.9, "learning_rate": 1.357446678046845e-07, "loss": 1.0195, "step": 29802 }, { "epoch": 0.9, "learning_rate": 1.356653966085286e-07, "loss": 0.9905, "step": 29803 }, { "epoch": 0.9, "learning_rate": 1.355861479196996e-07, "loss": 0.9924, "step": 29804 }, { "epoch": 0.9, "learning_rate": 1.355069217389518e-07, "loss": 1.1003, "step": 29805 }, { "epoch": 0.9, "learning_rate": 1.3542771806703964e-07, "loss": 1.1268, "step": 29806 }, { "epoch": 0.9, "learning_rate": 1.3534853690471638e-07, "loss": 1.1008, "step": 29807 }, { "epoch": 0.9, "learning_rate": 1.3526937825273617e-07, "loss": 1.0294, "step": 29808 }, { "epoch": 0.9, "learning_rate": 1.3519024211185257e-07, "loss": 1.0906, "step": 29809 }, { "epoch": 0.9, "learning_rate": 1.3511112848281882e-07, "loss": 1.1038, "step": 29810 }, { "epoch": 0.9, "learning_rate": 1.350320373663888e-07, "loss": 1.2338, "step": 29811 }, { "epoch": 0.9, "learning_rate": 1.3495296876331443e-07, "loss": 1.157, "step": 29812 }, { "epoch": 0.9, "learning_rate": 1.348739226743484e-07, "loss": 1.1795, "step": 29813 }, { "epoch": 0.9, "learning_rate": 1.3479489910024374e-07, "loss": 1.138, "step": 29814 }, { "epoch": 0.9, "learning_rate": 1.347158980417526e-07, "loss": 0.9577, "step": 29815 }, { "epoch": 0.9, "learning_rate": 1.3463691949962692e-07, "loss": 1.1354, "step": 29816 }, { "epoch": 0.9, "learning_rate": 1.3455796347461858e-07, "loss": 1.2133, "step": 29817 }, { "epoch": 0.9, "learning_rate": 1.344790299674792e-07, "loss": 1.0483, "step": 29818 }, { "epoch": 0.9, "learning_rate": 1.3440011897896038e-07, "loss": 1.1302, "step": 29819 }, { "epoch": 0.9, "learning_rate": 1.3432123050981295e-07, "loss": 1.0431, "step": 29820 }, { "epoch": 0.9, "learning_rate": 1.3424236456078792e-07, "loss": 1.0123, "step": 29821 }, { "epoch": 0.9, "learning_rate": 1.3416352113263614e-07, "loss": 1.1069, "step": 29822 }, { "epoch": 0.9, "learning_rate": 1.3408470022610837e-07, "loss": 1.1375, "step": 29823 }, { "epoch": 0.9, "learning_rate": 1.3400590184195512e-07, "loss": 1.0942, "step": 29824 }, { "epoch": 0.9, "learning_rate": 1.3392712598092578e-07, "loss": 1.1742, "step": 29825 }, { "epoch": 0.9, "learning_rate": 1.338483726437706e-07, "loss": 0.9976, "step": 29826 }, { "epoch": 0.9, "learning_rate": 1.3376964183123952e-07, "loss": 1.1611, "step": 29827 }, { "epoch": 0.9, "learning_rate": 1.3369093354408198e-07, "loss": 0.9938, "step": 29828 }, { "epoch": 0.9, "learning_rate": 1.3361224778304677e-07, "loss": 1.0641, "step": 29829 }, { "epoch": 0.9, "learning_rate": 1.3353358454888332e-07, "loss": 1.1257, "step": 29830 }, { "epoch": 0.9, "learning_rate": 1.3345494384234047e-07, "loss": 1.1158, "step": 29831 }, { "epoch": 0.9, "learning_rate": 1.333763256641671e-07, "loss": 1.0113, "step": 29832 }, { "epoch": 0.9, "learning_rate": 1.3329773001511115e-07, "loss": 1.0514, "step": 29833 }, { "epoch": 0.9, "learning_rate": 1.3321915689592068e-07, "loss": 1.1207, "step": 29834 }, { "epoch": 0.9, "learning_rate": 1.33140606307344e-07, "loss": 0.9637, "step": 29835 }, { "epoch": 0.9, "learning_rate": 1.330620782501288e-07, "loss": 1.0579, "step": 29836 }, { "epoch": 0.9, "learning_rate": 1.329835727250231e-07, "loss": 1.259, "step": 29837 }, { "epoch": 0.9, "learning_rate": 1.3290508973277354e-07, "loss": 1.0819, "step": 29838 }, { "epoch": 0.9, "learning_rate": 1.3282662927412732e-07, "loss": 1.1464, "step": 29839 }, { "epoch": 0.9, "learning_rate": 1.327481913498316e-07, "loss": 0.9977, "step": 29840 }, { "epoch": 0.9, "learning_rate": 1.3266977596063297e-07, "loss": 1.0244, "step": 29841 }, { "epoch": 0.9, "learning_rate": 1.3259138310727808e-07, "loss": 1.0036, "step": 29842 }, { "epoch": 0.9, "learning_rate": 1.3251301279051278e-07, "loss": 1.1151, "step": 29843 }, { "epoch": 0.9, "learning_rate": 1.324346650110836e-07, "loss": 1.0162, "step": 29844 }, { "epoch": 0.9, "learning_rate": 1.3235633976973638e-07, "loss": 1.1031, "step": 29845 }, { "epoch": 0.9, "learning_rate": 1.322780370672161e-07, "loss": 1.1884, "step": 29846 }, { "epoch": 0.9, "learning_rate": 1.3219975690426878e-07, "loss": 1.2017, "step": 29847 }, { "epoch": 0.9, "learning_rate": 1.3212149928163915e-07, "loss": 1.1107, "step": 29848 }, { "epoch": 0.9, "learning_rate": 1.320432642000727e-07, "loss": 1.1879, "step": 29849 }, { "epoch": 0.9, "learning_rate": 1.319650516603141e-07, "loss": 1.1085, "step": 29850 }, { "epoch": 0.9, "learning_rate": 1.318868616631072e-07, "loss": 1.0723, "step": 29851 }, { "epoch": 0.9, "learning_rate": 1.3180869420919727e-07, "loss": 1.0916, "step": 29852 }, { "epoch": 0.9, "learning_rate": 1.317305492993276e-07, "loss": 1.0322, "step": 29853 }, { "epoch": 0.9, "learning_rate": 1.3165242693424312e-07, "loss": 1.1782, "step": 29854 }, { "epoch": 0.9, "learning_rate": 1.315743271146866e-07, "loss": 1.1567, "step": 29855 }, { "epoch": 0.9, "learning_rate": 1.3149624984140159e-07, "loss": 1.2115, "step": 29856 }, { "epoch": 0.9, "learning_rate": 1.3141819511513164e-07, "loss": 1.1057, "step": 29857 }, { "epoch": 0.9, "learning_rate": 1.3134016293662012e-07, "loss": 1.0695, "step": 29858 }, { "epoch": 0.9, "learning_rate": 1.3126215330660912e-07, "loss": 1.0395, "step": 29859 }, { "epoch": 0.9, "learning_rate": 1.3118416622584173e-07, "loss": 1.0439, "step": 29860 }, { "epoch": 0.9, "learning_rate": 1.3110620169506012e-07, "loss": 1.0255, "step": 29861 }, { "epoch": 0.9, "learning_rate": 1.3102825971500644e-07, "loss": 1.0933, "step": 29862 }, { "epoch": 0.9, "learning_rate": 1.3095034028642317e-07, "loss": 1.0648, "step": 29863 }, { "epoch": 0.9, "learning_rate": 1.308724434100514e-07, "loss": 1.0623, "step": 29864 }, { "epoch": 0.9, "learning_rate": 1.3079456908663302e-07, "loss": 1.0715, "step": 29865 }, { "epoch": 0.9, "learning_rate": 1.3071671731690912e-07, "loss": 1.0457, "step": 29866 }, { "epoch": 0.9, "learning_rate": 1.30638888101621e-07, "loss": 1.1267, "step": 29867 }, { "epoch": 0.9, "learning_rate": 1.305610814415098e-07, "loss": 1.1457, "step": 29868 }, { "epoch": 0.9, "learning_rate": 1.3048329733731574e-07, "loss": 1.1349, "step": 29869 }, { "epoch": 0.9, "learning_rate": 1.304055357897799e-07, "loss": 1.1714, "step": 29870 }, { "epoch": 0.9, "learning_rate": 1.3032779679964164e-07, "loss": 1.0401, "step": 29871 }, { "epoch": 0.9, "learning_rate": 1.3025008036764154e-07, "loss": 1.0316, "step": 29872 }, { "epoch": 0.9, "learning_rate": 1.3017238649451952e-07, "loss": 1.076, "step": 29873 }, { "epoch": 0.9, "learning_rate": 1.3009471518101502e-07, "loss": 1.1362, "step": 29874 }, { "epoch": 0.9, "learning_rate": 1.3001706642786715e-07, "loss": 1.2112, "step": 29875 }, { "epoch": 0.9, "learning_rate": 1.299394402358159e-07, "loss": 1.0878, "step": 29876 }, { "epoch": 0.9, "learning_rate": 1.2986183660559954e-07, "loss": 1.0638, "step": 29877 }, { "epoch": 0.9, "learning_rate": 1.2978425553795692e-07, "loss": 1.0668, "step": 29878 }, { "epoch": 0.9, "learning_rate": 1.2970669703362665e-07, "loss": 1.0538, "step": 29879 }, { "epoch": 0.9, "learning_rate": 1.2962916109334727e-07, "loss": 1.109, "step": 29880 }, { "epoch": 0.9, "learning_rate": 1.2955164771785628e-07, "loss": 1.1649, "step": 29881 }, { "epoch": 0.9, "learning_rate": 1.2947415690789223e-07, "loss": 1.1088, "step": 29882 }, { "epoch": 0.9, "learning_rate": 1.293966886641923e-07, "loss": 1.0913, "step": 29883 }, { "epoch": 0.9, "learning_rate": 1.2931924298749454e-07, "loss": 1.1545, "step": 29884 }, { "epoch": 0.9, "learning_rate": 1.2924181987853558e-07, "loss": 1.1486, "step": 29885 }, { "epoch": 0.9, "learning_rate": 1.2916441933805256e-07, "loss": 1.1802, "step": 29886 }, { "epoch": 0.9, "learning_rate": 1.2908704136678246e-07, "loss": 1.1425, "step": 29887 }, { "epoch": 0.9, "learning_rate": 1.2900968596546188e-07, "loss": 1.0375, "step": 29888 }, { "epoch": 0.9, "learning_rate": 1.289323531348277e-07, "loss": 1.0742, "step": 29889 }, { "epoch": 0.9, "learning_rate": 1.2885504287561495e-07, "loss": 1.1726, "step": 29890 }, { "epoch": 0.9, "learning_rate": 1.287777551885605e-07, "loss": 1.1285, "step": 29891 }, { "epoch": 0.9, "learning_rate": 1.287004900743996e-07, "loss": 1.2369, "step": 29892 }, { "epoch": 0.9, "learning_rate": 1.2862324753386835e-07, "loss": 1.2358, "step": 29893 }, { "epoch": 0.9, "learning_rate": 1.285460275677014e-07, "loss": 1.1302, "step": 29894 }, { "epoch": 0.9, "learning_rate": 1.2846883017663403e-07, "loss": 1.0162, "step": 29895 }, { "epoch": 0.9, "learning_rate": 1.2839165536140148e-07, "loss": 1.1655, "step": 29896 }, { "epoch": 0.9, "learning_rate": 1.2831450312273785e-07, "loss": 1.0595, "step": 29897 }, { "epoch": 0.9, "learning_rate": 1.2823737346137815e-07, "loss": 1.1299, "step": 29898 }, { "epoch": 0.9, "learning_rate": 1.2816026637805623e-07, "loss": 1.0855, "step": 29899 }, { "epoch": 0.9, "learning_rate": 1.280831818735062e-07, "loss": 1.0115, "step": 29900 }, { "epoch": 0.9, "learning_rate": 1.2800611994846196e-07, "loss": 1.0547, "step": 29901 }, { "epoch": 0.9, "learning_rate": 1.279290806036576e-07, "loss": 0.9868, "step": 29902 }, { "epoch": 0.9, "learning_rate": 1.2785206383982535e-07, "loss": 0.9448, "step": 29903 }, { "epoch": 0.9, "learning_rate": 1.277750696576993e-07, "loss": 1.0219, "step": 29904 }, { "epoch": 0.9, "learning_rate": 1.276980980580117e-07, "loss": 1.0599, "step": 29905 }, { "epoch": 0.9, "learning_rate": 1.2762114904149637e-07, "loss": 1.0958, "step": 29906 }, { "epoch": 0.9, "learning_rate": 1.2754422260888466e-07, "loss": 1.1199, "step": 29907 }, { "epoch": 0.9, "learning_rate": 1.2746731876090907e-07, "loss": 1.1342, "step": 29908 }, { "epoch": 0.9, "learning_rate": 1.273904374983023e-07, "loss": 1.2, "step": 29909 }, { "epoch": 0.9, "learning_rate": 1.2731357882179608e-07, "loss": 1.0284, "step": 29910 }, { "epoch": 0.9, "learning_rate": 1.2723674273212166e-07, "loss": 1.1088, "step": 29911 }, { "epoch": 0.9, "learning_rate": 1.2715992923001046e-07, "loss": 1.1134, "step": 29912 }, { "epoch": 0.9, "learning_rate": 1.2708313831619412e-07, "loss": 1.1433, "step": 29913 }, { "epoch": 0.9, "learning_rate": 1.2700636999140342e-07, "loss": 1.1089, "step": 29914 }, { "epoch": 0.9, "learning_rate": 1.2692962425636945e-07, "loss": 1.0308, "step": 29915 }, { "epoch": 0.9, "learning_rate": 1.2685290111182218e-07, "loss": 1.042, "step": 29916 }, { "epoch": 0.9, "learning_rate": 1.2677620055849272e-07, "loss": 1.1526, "step": 29917 }, { "epoch": 0.9, "learning_rate": 1.2669952259711043e-07, "loss": 1.0898, "step": 29918 }, { "epoch": 0.9, "learning_rate": 1.2662286722840617e-07, "loss": 1.0491, "step": 29919 }, { "epoch": 0.9, "learning_rate": 1.2654623445310876e-07, "loss": 1.0739, "step": 29920 }, { "epoch": 0.9, "learning_rate": 1.264696242719482e-07, "loss": 1.0835, "step": 29921 }, { "epoch": 0.9, "learning_rate": 1.2639303668565362e-07, "loss": 1.0686, "step": 29922 }, { "epoch": 0.9, "learning_rate": 1.2631647169495416e-07, "loss": 1.0155, "step": 29923 }, { "epoch": 0.9, "learning_rate": 1.2623992930057865e-07, "loss": 1.0833, "step": 29924 }, { "epoch": 0.9, "learning_rate": 1.2616340950325572e-07, "loss": 1.2207, "step": 29925 }, { "epoch": 0.9, "learning_rate": 1.2608691230371394e-07, "loss": 1.0942, "step": 29926 }, { "epoch": 0.9, "learning_rate": 1.2601043770268162e-07, "loss": 1.0275, "step": 29927 }, { "epoch": 0.9, "learning_rate": 1.2593398570088678e-07, "loss": 1.031, "step": 29928 }, { "epoch": 0.9, "learning_rate": 1.258575562990566e-07, "loss": 1.1374, "step": 29929 }, { "epoch": 0.9, "learning_rate": 1.2578114949791886e-07, "loss": 1.0054, "step": 29930 }, { "epoch": 0.9, "learning_rate": 1.2570476529820157e-07, "loss": 1.1519, "step": 29931 }, { "epoch": 0.9, "learning_rate": 1.256284037006314e-07, "loss": 1.0093, "step": 29932 }, { "epoch": 0.9, "learning_rate": 1.2555206470593524e-07, "loss": 0.9506, "step": 29933 }, { "epoch": 0.9, "learning_rate": 1.2547574831483944e-07, "loss": 1.0383, "step": 29934 }, { "epoch": 0.9, "learning_rate": 1.2539945452807123e-07, "loss": 1.0469, "step": 29935 }, { "epoch": 0.9, "learning_rate": 1.2532318334635695e-07, "loss": 1.1785, "step": 29936 }, { "epoch": 0.9, "learning_rate": 1.252469347704216e-07, "loss": 1.2156, "step": 29937 }, { "epoch": 0.9, "learning_rate": 1.2517070880099208e-07, "loss": 1.0858, "step": 29938 }, { "epoch": 0.9, "learning_rate": 1.2509450543879338e-07, "loss": 1.0344, "step": 29939 }, { "epoch": 0.9, "learning_rate": 1.2501832468455154e-07, "loss": 1.0657, "step": 29940 }, { "epoch": 0.9, "learning_rate": 1.2494216653899134e-07, "loss": 1.1002, "step": 29941 }, { "epoch": 0.9, "learning_rate": 1.2486603100283767e-07, "loss": 1.117, "step": 29942 }, { "epoch": 0.9, "learning_rate": 1.2478991807681555e-07, "loss": 1.1832, "step": 29943 }, { "epoch": 0.9, "learning_rate": 1.2471382776164943e-07, "loss": 1.0341, "step": 29944 }, { "epoch": 0.9, "learning_rate": 1.2463776005806422e-07, "loss": 1.0775, "step": 29945 }, { "epoch": 0.9, "learning_rate": 1.24561714966783e-07, "loss": 1.0898, "step": 29946 }, { "epoch": 0.9, "learning_rate": 1.2448569248853016e-07, "loss": 1.1509, "step": 29947 }, { "epoch": 0.9, "learning_rate": 1.244096926240296e-07, "loss": 1.0631, "step": 29948 }, { "epoch": 0.9, "learning_rate": 1.243337153740043e-07, "loss": 1.2437, "step": 29949 }, { "epoch": 0.9, "learning_rate": 1.2425776073917818e-07, "loss": 1.1146, "step": 29950 }, { "epoch": 0.9, "learning_rate": 1.2418182872027397e-07, "loss": 1.0345, "step": 29951 }, { "epoch": 0.9, "learning_rate": 1.241059193180144e-07, "loss": 1.1341, "step": 29952 }, { "epoch": 0.9, "learning_rate": 1.2403003253312258e-07, "loss": 1.0469, "step": 29953 }, { "epoch": 0.9, "learning_rate": 1.2395416836632007e-07, "loss": 1.1314, "step": 29954 }, { "epoch": 0.9, "learning_rate": 1.2387832681832968e-07, "loss": 1.1118, "step": 29955 }, { "epoch": 0.9, "learning_rate": 1.238025078898733e-07, "loss": 1.1094, "step": 29956 }, { "epoch": 0.9, "learning_rate": 1.237267115816726e-07, "loss": 1.1192, "step": 29957 }, { "epoch": 0.9, "learning_rate": 1.236509378944495e-07, "loss": 1.1899, "step": 29958 }, { "epoch": 0.9, "learning_rate": 1.235751868289245e-07, "loss": 1.0851, "step": 29959 }, { "epoch": 0.9, "learning_rate": 1.2349945838581928e-07, "loss": 1.0416, "step": 29960 }, { "epoch": 0.9, "learning_rate": 1.2342375256585465e-07, "loss": 1.0745, "step": 29961 }, { "epoch": 0.9, "learning_rate": 1.2334806936975168e-07, "loss": 1.0782, "step": 29962 }, { "epoch": 0.9, "learning_rate": 1.232724087982301e-07, "loss": 1.1011, "step": 29963 }, { "epoch": 0.9, "learning_rate": 1.231967708520107e-07, "loss": 0.9847, "step": 29964 }, { "epoch": 0.9, "learning_rate": 1.2312115553181293e-07, "loss": 1.0198, "step": 29965 }, { "epoch": 0.9, "learning_rate": 1.2304556283835727e-07, "loss": 1.0764, "step": 29966 }, { "epoch": 0.9, "learning_rate": 1.229699927723635e-07, "loss": 1.0841, "step": 29967 }, { "epoch": 0.9, "learning_rate": 1.2289444533455013e-07, "loss": 1.1717, "step": 29968 }, { "epoch": 0.9, "learning_rate": 1.2281892052563666e-07, "loss": 1.1828, "step": 29969 }, { "epoch": 0.9, "learning_rate": 1.2274341834634246e-07, "loss": 1.1138, "step": 29970 }, { "epoch": 0.9, "learning_rate": 1.2266793879738613e-07, "loss": 1.0284, "step": 29971 }, { "epoch": 0.9, "learning_rate": 1.2259248187948576e-07, "loss": 1.1899, "step": 29972 }, { "epoch": 0.9, "learning_rate": 1.2251704759335986e-07, "loss": 1.0279, "step": 29973 }, { "epoch": 0.9, "learning_rate": 1.224416359397268e-07, "loss": 1.1339, "step": 29974 }, { "epoch": 0.9, "learning_rate": 1.223662469193046e-07, "loss": 1.1258, "step": 29975 }, { "epoch": 0.9, "learning_rate": 1.2229088053281017e-07, "loss": 1.1218, "step": 29976 }, { "epoch": 0.9, "learning_rate": 1.2221553678096133e-07, "loss": 1.1778, "step": 29977 }, { "epoch": 0.9, "learning_rate": 1.2214021566447577e-07, "loss": 1.0186, "step": 29978 }, { "epoch": 0.9, "learning_rate": 1.2206491718406989e-07, "loss": 1.0687, "step": 29979 }, { "epoch": 0.9, "learning_rate": 1.219896413404606e-07, "loss": 1.0727, "step": 29980 }, { "epoch": 0.9, "learning_rate": 1.2191438813436486e-07, "loss": 1.1129, "step": 29981 }, { "epoch": 0.9, "learning_rate": 1.2183915756649873e-07, "loss": 0.9695, "step": 29982 }, { "epoch": 0.9, "learning_rate": 1.217639496375786e-07, "loss": 1.1434, "step": 29983 }, { "epoch": 0.9, "learning_rate": 1.2168876434832056e-07, "loss": 0.9997, "step": 29984 }, { "epoch": 0.9, "learning_rate": 1.2161360169943958e-07, "loss": 1.0587, "step": 29985 }, { "epoch": 0.9, "learning_rate": 1.2153846169165178e-07, "loss": 1.0972, "step": 29986 }, { "epoch": 0.9, "learning_rate": 1.2146334432567214e-07, "loss": 1.1393, "step": 29987 }, { "epoch": 0.9, "learning_rate": 1.2138824960221645e-07, "loss": 1.132, "step": 29988 }, { "epoch": 0.9, "learning_rate": 1.2131317752199861e-07, "loss": 1.1367, "step": 29989 }, { "epoch": 0.9, "learning_rate": 1.2123812808573387e-07, "loss": 1.0844, "step": 29990 }, { "epoch": 0.9, "learning_rate": 1.2116310129413638e-07, "loss": 1.1554, "step": 29991 }, { "epoch": 0.9, "learning_rate": 1.2108809714792087e-07, "loss": 1.2034, "step": 29992 }, { "epoch": 0.9, "learning_rate": 1.2101311564780034e-07, "loss": 1.3423, "step": 29993 }, { "epoch": 0.9, "learning_rate": 1.209381567944895e-07, "loss": 1.2115, "step": 29994 }, { "epoch": 0.9, "learning_rate": 1.2086322058870142e-07, "loss": 1.1189, "step": 29995 }, { "epoch": 0.9, "learning_rate": 1.2078830703114967e-07, "loss": 1.0844, "step": 29996 }, { "epoch": 0.9, "learning_rate": 1.2071341612254788e-07, "loss": 1.0754, "step": 29997 }, { "epoch": 0.9, "learning_rate": 1.2063854786360795e-07, "loss": 1.0289, "step": 29998 }, { "epoch": 0.9, "learning_rate": 1.205637022550432e-07, "loss": 1.1599, "step": 29999 }, { "epoch": 0.9, "learning_rate": 1.2048887929756614e-07, "loss": 1.1059, "step": 30000 }, { "epoch": 0.9, "learning_rate": 1.2041407899188895e-07, "loss": 1.1181, "step": 30001 }, { "epoch": 0.9, "learning_rate": 1.2033930133872356e-07, "loss": 1.0063, "step": 30002 }, { "epoch": 0.9, "learning_rate": 1.2026454633878194e-07, "loss": 1.0369, "step": 30003 }, { "epoch": 0.9, "learning_rate": 1.201898139927757e-07, "loss": 1.152, "step": 30004 }, { "epoch": 0.9, "learning_rate": 1.2011510430141622e-07, "loss": 1.1018, "step": 30005 }, { "epoch": 0.9, "learning_rate": 1.2004041726541487e-07, "loss": 1.1316, "step": 30006 }, { "epoch": 0.9, "learning_rate": 1.199657528854825e-07, "loss": 1.0516, "step": 30007 }, { "epoch": 0.9, "learning_rate": 1.1989111116232966e-07, "loss": 1.0403, "step": 30008 }, { "epoch": 0.9, "learning_rate": 1.198164920966674e-07, "loss": 1.2139, "step": 30009 }, { "epoch": 0.9, "learning_rate": 1.1974189568920602e-07, "loss": 1.0143, "step": 30010 }, { "epoch": 0.9, "learning_rate": 1.1966732194065522e-07, "loss": 1.1433, "step": 30011 }, { "epoch": 0.9, "learning_rate": 1.19592770851725e-07, "loss": 1.1647, "step": 30012 }, { "epoch": 0.9, "learning_rate": 1.195182424231253e-07, "loss": 1.0352, "step": 30013 }, { "epoch": 0.9, "learning_rate": 1.1944373665556564e-07, "loss": 1.0272, "step": 30014 }, { "epoch": 0.9, "learning_rate": 1.193692535497548e-07, "loss": 1.0472, "step": 30015 }, { "epoch": 0.9, "learning_rate": 1.1929479310640203e-07, "loss": 1.1987, "step": 30016 }, { "epoch": 0.9, "learning_rate": 1.192203553262164e-07, "loss": 1.1168, "step": 30017 }, { "epoch": 0.9, "learning_rate": 1.1914594020990655e-07, "loss": 1.2404, "step": 30018 }, { "epoch": 0.9, "learning_rate": 1.1907154775818026e-07, "loss": 1.2094, "step": 30019 }, { "epoch": 0.9, "learning_rate": 1.1899717797174637e-07, "loss": 1.0231, "step": 30020 }, { "epoch": 0.9, "learning_rate": 1.189228308513124e-07, "loss": 1.1437, "step": 30021 }, { "epoch": 0.9, "learning_rate": 1.1884850639758667e-07, "loss": 1.0867, "step": 30022 }, { "epoch": 0.9, "learning_rate": 1.1877420461127636e-07, "loss": 1.0322, "step": 30023 }, { "epoch": 0.9, "learning_rate": 1.1869992549308845e-07, "loss": 1.144, "step": 30024 }, { "epoch": 0.9, "learning_rate": 1.1862566904373068e-07, "loss": 0.9772, "step": 30025 }, { "epoch": 0.9, "learning_rate": 1.1855143526390944e-07, "loss": 1.1503, "step": 30026 }, { "epoch": 0.9, "learning_rate": 1.1847722415433193e-07, "loss": 1.1447, "step": 30027 }, { "epoch": 0.9, "learning_rate": 1.18403035715704e-07, "loss": 1.0629, "step": 30028 }, { "epoch": 0.9, "learning_rate": 1.18328869948732e-07, "loss": 1.1633, "step": 30029 }, { "epoch": 0.9, "learning_rate": 1.1825472685412204e-07, "loss": 1.0452, "step": 30030 }, { "epoch": 0.9, "learning_rate": 1.1818060643258022e-07, "loss": 1.0978, "step": 30031 }, { "epoch": 0.9, "learning_rate": 1.1810650868481183e-07, "loss": 1.0995, "step": 30032 }, { "epoch": 0.9, "learning_rate": 1.1803243361152239e-07, "loss": 1.1071, "step": 30033 }, { "epoch": 0.9, "learning_rate": 1.1795838121341691e-07, "loss": 1.1386, "step": 30034 }, { "epoch": 0.9, "learning_rate": 1.1788435149120064e-07, "loss": 1.0488, "step": 30035 }, { "epoch": 0.9, "learning_rate": 1.1781034444557776e-07, "loss": 1.0903, "step": 30036 }, { "epoch": 0.9, "learning_rate": 1.1773636007725325e-07, "loss": 1.0414, "step": 30037 }, { "epoch": 0.9, "learning_rate": 1.1766239838693128e-07, "loss": 1.0726, "step": 30038 }, { "epoch": 0.9, "learning_rate": 1.1758845937531571e-07, "loss": 1.1637, "step": 30039 }, { "epoch": 0.9, "learning_rate": 1.17514543043111e-07, "loss": 1.1257, "step": 30040 }, { "epoch": 0.9, "learning_rate": 1.1744064939102018e-07, "loss": 1.1379, "step": 30041 }, { "epoch": 0.91, "learning_rate": 1.1736677841974687e-07, "loss": 1.2188, "step": 30042 }, { "epoch": 0.91, "learning_rate": 1.172929301299941e-07, "loss": 1.1658, "step": 30043 }, { "epoch": 0.91, "learning_rate": 1.1721910452246577e-07, "loss": 1.1807, "step": 30044 }, { "epoch": 0.91, "learning_rate": 1.1714530159786325e-07, "loss": 1.195, "step": 30045 }, { "epoch": 0.91, "learning_rate": 1.1707152135689015e-07, "loss": 1.1077, "step": 30046 }, { "epoch": 0.91, "learning_rate": 1.169977638002484e-07, "loss": 1.0818, "step": 30047 }, { "epoch": 0.91, "learning_rate": 1.1692402892864025e-07, "loss": 1.1751, "step": 30048 }, { "epoch": 0.91, "learning_rate": 1.1685031674276786e-07, "loss": 1.1019, "step": 30049 }, { "epoch": 0.91, "learning_rate": 1.1677662724333238e-07, "loss": 1.1711, "step": 30050 }, { "epoch": 0.91, "learning_rate": 1.1670296043103574e-07, "loss": 1.1219, "step": 30051 }, { "epoch": 0.91, "learning_rate": 1.1662931630657904e-07, "loss": 1.0776, "step": 30052 }, { "epoch": 0.91, "learning_rate": 1.1655569487066365e-07, "loss": 1.1326, "step": 30053 }, { "epoch": 0.91, "learning_rate": 1.1648209612398986e-07, "loss": 1.1784, "step": 30054 }, { "epoch": 0.91, "learning_rate": 1.164085200672585e-07, "loss": 1.1161, "step": 30055 }, { "epoch": 0.91, "learning_rate": 1.1633496670117011e-07, "loss": 1.0923, "step": 30056 }, { "epoch": 0.91, "learning_rate": 1.1626143602642526e-07, "loss": 1.0942, "step": 30057 }, { "epoch": 0.91, "learning_rate": 1.1618792804372308e-07, "loss": 1.2051, "step": 30058 }, { "epoch": 0.91, "learning_rate": 1.161144427537636e-07, "loss": 1.007, "step": 30059 }, { "epoch": 0.91, "learning_rate": 1.1604098015724653e-07, "loss": 1.0847, "step": 30060 }, { "epoch": 0.91, "learning_rate": 1.1596754025487128e-07, "loss": 1.1364, "step": 30061 }, { "epoch": 0.91, "learning_rate": 1.1589412304733705e-07, "loss": 1.1619, "step": 30062 }, { "epoch": 0.91, "learning_rate": 1.1582072853534216e-07, "loss": 1.1634, "step": 30063 }, { "epoch": 0.91, "learning_rate": 1.1574735671958603e-07, "loss": 1.0276, "step": 30064 }, { "epoch": 0.91, "learning_rate": 1.1567400760076648e-07, "loss": 1.0551, "step": 30065 }, { "epoch": 0.91, "learning_rate": 1.1560068117958234e-07, "loss": 1.1418, "step": 30066 }, { "epoch": 0.91, "learning_rate": 1.1552737745673115e-07, "loss": 1.0754, "step": 30067 }, { "epoch": 0.91, "learning_rate": 1.1545409643291094e-07, "loss": 1.2084, "step": 30068 }, { "epoch": 0.91, "learning_rate": 1.153808381088195e-07, "loss": 1.0921, "step": 30069 }, { "epoch": 0.91, "learning_rate": 1.1530760248515404e-07, "loss": 1.0364, "step": 30070 }, { "epoch": 0.91, "learning_rate": 1.1523438956261152e-07, "loss": 1.1009, "step": 30071 }, { "epoch": 0.91, "learning_rate": 1.1516119934188885e-07, "loss": 1.1877, "step": 30072 }, { "epoch": 0.91, "learning_rate": 1.1508803182368328e-07, "loss": 1.1906, "step": 30073 }, { "epoch": 0.91, "learning_rate": 1.150148870086909e-07, "loss": 0.9792, "step": 30074 }, { "epoch": 0.91, "learning_rate": 1.1494176489760839e-07, "loss": 1.1789, "step": 30075 }, { "epoch": 0.91, "learning_rate": 1.148686654911313e-07, "loss": 1.0574, "step": 30076 }, { "epoch": 0.91, "learning_rate": 1.1479558878995601e-07, "loss": 1.0323, "step": 30077 }, { "epoch": 0.91, "learning_rate": 1.147225347947778e-07, "loss": 1.1774, "step": 30078 }, { "epoch": 0.91, "learning_rate": 1.146495035062925e-07, "loss": 1.0082, "step": 30079 }, { "epoch": 0.91, "learning_rate": 1.1457649492519484e-07, "loss": 1.1264, "step": 30080 }, { "epoch": 0.91, "learning_rate": 1.1450350905218011e-07, "loss": 1.1104, "step": 30081 }, { "epoch": 0.91, "learning_rate": 1.14430545887943e-07, "loss": 1.0831, "step": 30082 }, { "epoch": 0.91, "learning_rate": 1.1435760543317881e-07, "loss": 1.1395, "step": 30083 }, { "epoch": 0.91, "learning_rate": 1.1428468768858058e-07, "loss": 1.0284, "step": 30084 }, { "epoch": 0.91, "learning_rate": 1.1421179265484333e-07, "loss": 1.1282, "step": 30085 }, { "epoch": 0.91, "learning_rate": 1.1413892033266066e-07, "loss": 1.1411, "step": 30086 }, { "epoch": 0.91, "learning_rate": 1.1406607072272619e-07, "loss": 1.212, "step": 30087 }, { "epoch": 0.91, "learning_rate": 1.1399324382573407e-07, "loss": 0.9887, "step": 30088 }, { "epoch": 0.91, "learning_rate": 1.1392043964237681e-07, "loss": 1.1452, "step": 30089 }, { "epoch": 0.91, "learning_rate": 1.1384765817334802e-07, "loss": 1.1702, "step": 30090 }, { "epoch": 0.91, "learning_rate": 1.1377489941933994e-07, "loss": 1.1761, "step": 30091 }, { "epoch": 0.91, "learning_rate": 1.1370216338104617e-07, "loss": 1.1677, "step": 30092 }, { "epoch": 0.91, "learning_rate": 1.1362945005915838e-07, "loss": 1.1571, "step": 30093 }, { "epoch": 0.91, "learning_rate": 1.135567594543685e-07, "loss": 1.1685, "step": 30094 }, { "epoch": 0.91, "learning_rate": 1.1348409156736906e-07, "loss": 1.0127, "step": 30095 }, { "epoch": 0.91, "learning_rate": 1.1341144639885226e-07, "loss": 0.9685, "step": 30096 }, { "epoch": 0.91, "learning_rate": 1.1333882394950841e-07, "loss": 1.0914, "step": 30097 }, { "epoch": 0.91, "learning_rate": 1.132662242200297e-07, "loss": 1.1302, "step": 30098 }, { "epoch": 0.91, "learning_rate": 1.1319364721110698e-07, "loss": 1.0237, "step": 30099 }, { "epoch": 0.91, "learning_rate": 1.1312109292343138e-07, "loss": 1.1332, "step": 30100 }, { "epoch": 0.91, "learning_rate": 1.1304856135769343e-07, "loss": 1.072, "step": 30101 }, { "epoch": 0.91, "learning_rate": 1.1297605251458343e-07, "loss": 1.0743, "step": 30102 }, { "epoch": 0.91, "learning_rate": 1.1290356639479166e-07, "loss": 1.11, "step": 30103 }, { "epoch": 0.91, "learning_rate": 1.128311029990084e-07, "loss": 1.112, "step": 30104 }, { "epoch": 0.91, "learning_rate": 1.1275866232792365e-07, "loss": 1.058, "step": 30105 }, { "epoch": 0.91, "learning_rate": 1.1268624438222631e-07, "loss": 1.0443, "step": 30106 }, { "epoch": 0.91, "learning_rate": 1.1261384916260637e-07, "loss": 1.1503, "step": 30107 }, { "epoch": 0.91, "learning_rate": 1.1254147666975245e-07, "loss": 1.0897, "step": 30108 }, { "epoch": 0.91, "learning_rate": 1.124691269043543e-07, "loss": 1.1759, "step": 30109 }, { "epoch": 0.91, "learning_rate": 1.1239679986709995e-07, "loss": 1.1547, "step": 30110 }, { "epoch": 0.91, "learning_rate": 1.1232449555867803e-07, "loss": 0.9899, "step": 30111 }, { "epoch": 0.91, "learning_rate": 1.1225221397977714e-07, "loss": 1.1426, "step": 30112 }, { "epoch": 0.91, "learning_rate": 1.121799551310851e-07, "loss": 1.0906, "step": 30113 }, { "epoch": 0.91, "learning_rate": 1.1210771901328993e-07, "loss": 1.1703, "step": 30114 }, { "epoch": 0.91, "learning_rate": 1.1203550562707915e-07, "loss": 1.1172, "step": 30115 }, { "epoch": 0.91, "learning_rate": 1.1196331497314028e-07, "loss": 1.1083, "step": 30116 }, { "epoch": 0.91, "learning_rate": 1.1189114705216081e-07, "loss": 1.1182, "step": 30117 }, { "epoch": 0.91, "learning_rate": 1.1181900186482713e-07, "loss": 1.215, "step": 30118 }, { "epoch": 0.91, "learning_rate": 1.1174687941182649e-07, "loss": 0.9201, "step": 30119 }, { "epoch": 0.91, "learning_rate": 1.1167477969384527e-07, "loss": 1.0752, "step": 30120 }, { "epoch": 0.91, "learning_rate": 1.1160270271156987e-07, "loss": 1.1213, "step": 30121 }, { "epoch": 0.91, "learning_rate": 1.1153064846568667e-07, "loss": 1.0459, "step": 30122 }, { "epoch": 0.91, "learning_rate": 1.1145861695688126e-07, "loss": 1.0925, "step": 30123 }, { "epoch": 0.91, "learning_rate": 1.1138660818583919e-07, "loss": 1.0859, "step": 30124 }, { "epoch": 0.91, "learning_rate": 1.1131462215324657e-07, "loss": 1.1299, "step": 30125 }, { "epoch": 0.91, "learning_rate": 1.1124265885978813e-07, "loss": 1.0651, "step": 30126 }, { "epoch": 0.91, "learning_rate": 1.1117071830614945e-07, "loss": 1.0829, "step": 30127 }, { "epoch": 0.91, "learning_rate": 1.1109880049301469e-07, "loss": 0.9779, "step": 30128 }, { "epoch": 0.91, "learning_rate": 1.1102690542106887e-07, "loss": 1.0634, "step": 30129 }, { "epoch": 0.91, "learning_rate": 1.1095503309099614e-07, "loss": 1.1985, "step": 30130 }, { "epoch": 0.91, "learning_rate": 1.1088318350348126e-07, "loss": 1.0929, "step": 30131 }, { "epoch": 0.91, "learning_rate": 1.1081135665920783e-07, "loss": 1.1545, "step": 30132 }, { "epoch": 0.91, "learning_rate": 1.1073955255885921e-07, "loss": 1.075, "step": 30133 }, { "epoch": 0.91, "learning_rate": 1.1066777120311956e-07, "loss": 1.1537, "step": 30134 }, { "epoch": 0.91, "learning_rate": 1.105960125926725e-07, "loss": 1.0349, "step": 30135 }, { "epoch": 0.91, "learning_rate": 1.1052427672819998e-07, "loss": 1.1884, "step": 30136 }, { "epoch": 0.91, "learning_rate": 1.1045256361038565e-07, "loss": 0.9839, "step": 30137 }, { "epoch": 0.91, "learning_rate": 1.1038087323991197e-07, "loss": 1.0698, "step": 30138 }, { "epoch": 0.91, "learning_rate": 1.1030920561746178e-07, "loss": 1.0944, "step": 30139 }, { "epoch": 0.91, "learning_rate": 1.1023756074371699e-07, "loss": 1.0729, "step": 30140 }, { "epoch": 0.91, "learning_rate": 1.1016593861935959e-07, "loss": 1.136, "step": 30141 }, { "epoch": 0.91, "learning_rate": 1.1009433924507152e-07, "loss": 1.0079, "step": 30142 }, { "epoch": 0.91, "learning_rate": 1.1002276262153416e-07, "loss": 1.0829, "step": 30143 }, { "epoch": 0.91, "learning_rate": 1.0995120874942893e-07, "loss": 1.0803, "step": 30144 }, { "epoch": 0.91, "learning_rate": 1.0987967762943725e-07, "loss": 1.0894, "step": 30145 }, { "epoch": 0.91, "learning_rate": 1.0980816926223992e-07, "loss": 1.106, "step": 30146 }, { "epoch": 0.91, "learning_rate": 1.097366836485178e-07, "loss": 1.0002, "step": 30147 }, { "epoch": 0.91, "learning_rate": 1.0966522078895147e-07, "loss": 1.2068, "step": 30148 }, { "epoch": 0.91, "learning_rate": 1.0959378068422066e-07, "loss": 1.1108, "step": 30149 }, { "epoch": 0.91, "learning_rate": 1.0952236333500594e-07, "loss": 1.0667, "step": 30150 }, { "epoch": 0.91, "learning_rate": 1.0945096874198674e-07, "loss": 1.105, "step": 30151 }, { "epoch": 0.91, "learning_rate": 1.093795969058431e-07, "loss": 1.0487, "step": 30152 }, { "epoch": 0.91, "learning_rate": 1.0930824782725474e-07, "loss": 1.0914, "step": 30153 }, { "epoch": 0.91, "learning_rate": 1.092369215069003e-07, "loss": 1.1458, "step": 30154 }, { "epoch": 0.91, "learning_rate": 1.0916561794545865e-07, "loss": 1.0807, "step": 30155 }, { "epoch": 0.91, "learning_rate": 1.0909433714360901e-07, "loss": 1.072, "step": 30156 }, { "epoch": 0.91, "learning_rate": 1.0902307910202997e-07, "loss": 1.0776, "step": 30157 }, { "epoch": 0.91, "learning_rate": 1.0895184382139962e-07, "loss": 1.1892, "step": 30158 }, { "epoch": 0.91, "learning_rate": 1.0888063130239573e-07, "loss": 1.0361, "step": 30159 }, { "epoch": 0.91, "learning_rate": 1.0880944154569694e-07, "loss": 1.0978, "step": 30160 }, { "epoch": 0.91, "learning_rate": 1.0873827455198104e-07, "loss": 1.1135, "step": 30161 }, { "epoch": 0.91, "learning_rate": 1.0866713032192444e-07, "loss": 1.0961, "step": 30162 }, { "epoch": 0.91, "learning_rate": 1.085960088562052e-07, "loss": 1.0698, "step": 30163 }, { "epoch": 0.91, "learning_rate": 1.0852491015550026e-07, "loss": 1.1536, "step": 30164 }, { "epoch": 0.91, "learning_rate": 1.0845383422048689e-07, "loss": 1.0351, "step": 30165 }, { "epoch": 0.91, "learning_rate": 1.0838278105184064e-07, "loss": 1.0402, "step": 30166 }, { "epoch": 0.91, "learning_rate": 1.0831175065023846e-07, "loss": 1.0153, "step": 30167 }, { "epoch": 0.91, "learning_rate": 1.0824074301635679e-07, "loss": 1.0403, "step": 30168 }, { "epoch": 0.91, "learning_rate": 1.0816975815087116e-07, "loss": 1.1765, "step": 30169 }, { "epoch": 0.91, "learning_rate": 1.0809879605445745e-07, "loss": 1.0632, "step": 30170 }, { "epoch": 0.91, "learning_rate": 1.0802785672779121e-07, "loss": 1.1648, "step": 30171 }, { "epoch": 0.91, "learning_rate": 1.0795694017154773e-07, "loss": 1.1264, "step": 30172 }, { "epoch": 0.91, "learning_rate": 1.0788604638640232e-07, "loss": 1.2218, "step": 30173 }, { "epoch": 0.91, "learning_rate": 1.0781517537302971e-07, "loss": 1.1274, "step": 30174 }, { "epoch": 0.91, "learning_rate": 1.0774432713210437e-07, "loss": 1.1586, "step": 30175 }, { "epoch": 0.91, "learning_rate": 1.0767350166430101e-07, "loss": 1.1007, "step": 30176 }, { "epoch": 0.91, "learning_rate": 1.0760269897029357e-07, "loss": 1.1707, "step": 30177 }, { "epoch": 0.91, "learning_rate": 1.075319190507565e-07, "loss": 1.1369, "step": 30178 }, { "epoch": 0.91, "learning_rate": 1.0746116190636313e-07, "loss": 1.1356, "step": 30179 }, { "epoch": 0.91, "learning_rate": 1.073904275377871e-07, "loss": 1.1366, "step": 30180 }, { "epoch": 0.91, "learning_rate": 1.0731971594570206e-07, "loss": 1.1762, "step": 30181 }, { "epoch": 0.91, "learning_rate": 1.0724902713078078e-07, "loss": 1.1076, "step": 30182 }, { "epoch": 0.91, "learning_rate": 1.0717836109369661e-07, "loss": 1.0903, "step": 30183 }, { "epoch": 0.91, "learning_rate": 1.071077178351218e-07, "loss": 1.0933, "step": 30184 }, { "epoch": 0.91, "learning_rate": 1.0703709735572914e-07, "loss": 1.0546, "step": 30185 }, { "epoch": 0.91, "learning_rate": 1.0696649965619088e-07, "loss": 1.111, "step": 30186 }, { "epoch": 0.91, "learning_rate": 1.0689592473717924e-07, "loss": 1.0284, "step": 30187 }, { "epoch": 0.91, "learning_rate": 1.0682537259936538e-07, "loss": 1.0992, "step": 30188 }, { "epoch": 0.91, "learning_rate": 1.067548432434215e-07, "loss": 1.0661, "step": 30189 }, { "epoch": 0.91, "learning_rate": 1.0668433667001904e-07, "loss": 1.028, "step": 30190 }, { "epoch": 0.91, "learning_rate": 1.0661385287982912e-07, "loss": 1.1108, "step": 30191 }, { "epoch": 0.91, "learning_rate": 1.0654339187352231e-07, "loss": 1.1819, "step": 30192 }, { "epoch": 0.91, "learning_rate": 1.0647295365177002e-07, "loss": 1.1506, "step": 30193 }, { "epoch": 0.91, "learning_rate": 1.0640253821524199e-07, "loss": 1.1664, "step": 30194 }, { "epoch": 0.91, "learning_rate": 1.0633214556460936e-07, "loss": 1.025, "step": 30195 }, { "epoch": 0.91, "learning_rate": 1.0626177570054158e-07, "loss": 1.0486, "step": 30196 }, { "epoch": 0.91, "learning_rate": 1.0619142862370896e-07, "loss": 1.1199, "step": 30197 }, { "epoch": 0.91, "learning_rate": 1.0612110433478123e-07, "loss": 1.0844, "step": 30198 }, { "epoch": 0.91, "learning_rate": 1.0605080283442759e-07, "loss": 1.142, "step": 30199 }, { "epoch": 0.91, "learning_rate": 1.0598052412331722e-07, "loss": 0.9826, "step": 30200 }, { "epoch": 0.91, "learning_rate": 1.059102682021193e-07, "loss": 1.1019, "step": 30201 }, { "epoch": 0.91, "learning_rate": 1.0584003507150276e-07, "loss": 1.1794, "step": 30202 }, { "epoch": 0.91, "learning_rate": 1.0576982473213565e-07, "loss": 1.0066, "step": 30203 }, { "epoch": 0.91, "learning_rate": 1.0569963718468718e-07, "loss": 1.1012, "step": 30204 }, { "epoch": 0.91, "learning_rate": 1.0562947242982485e-07, "loss": 1.0739, "step": 30205 }, { "epoch": 0.91, "learning_rate": 1.0555933046821676e-07, "loss": 1.223, "step": 30206 }, { "epoch": 0.91, "learning_rate": 1.0548921130053041e-07, "loss": 1.0874, "step": 30207 }, { "epoch": 0.91, "learning_rate": 1.0541911492743362e-07, "loss": 1.0314, "step": 30208 }, { "epoch": 0.91, "learning_rate": 1.053490413495939e-07, "loss": 1.1464, "step": 30209 }, { "epoch": 0.91, "learning_rate": 1.0527899056767792e-07, "loss": 1.0441, "step": 30210 }, { "epoch": 0.91, "learning_rate": 1.0520896258235242e-07, "loss": 1.0737, "step": 30211 }, { "epoch": 0.91, "learning_rate": 1.0513895739428403e-07, "loss": 1.1869, "step": 30212 }, { "epoch": 0.91, "learning_rate": 1.0506897500414003e-07, "loss": 1.1655, "step": 30213 }, { "epoch": 0.91, "learning_rate": 1.0499901541258545e-07, "loss": 1.07, "step": 30214 }, { "epoch": 0.91, "learning_rate": 1.0492907862028668e-07, "loss": 0.9963, "step": 30215 }, { "epoch": 0.91, "learning_rate": 1.0485916462790985e-07, "loss": 1.0417, "step": 30216 }, { "epoch": 0.91, "learning_rate": 1.0478927343612028e-07, "loss": 1.1667, "step": 30217 }, { "epoch": 0.91, "learning_rate": 1.0471940504558325e-07, "loss": 1.1489, "step": 30218 }, { "epoch": 0.91, "learning_rate": 1.0464955945696353e-07, "loss": 1.0305, "step": 30219 }, { "epoch": 0.91, "learning_rate": 1.045797366709267e-07, "loss": 1.0667, "step": 30220 }, { "epoch": 0.91, "learning_rate": 1.0450993668813692e-07, "loss": 1.1262, "step": 30221 }, { "epoch": 0.91, "learning_rate": 1.0444015950925895e-07, "loss": 1.0638, "step": 30222 }, { "epoch": 0.91, "learning_rate": 1.0437040513495699e-07, "loss": 1.0271, "step": 30223 }, { "epoch": 0.91, "learning_rate": 1.0430067356589469e-07, "loss": 1.2325, "step": 30224 }, { "epoch": 0.91, "learning_rate": 1.042309648027362e-07, "loss": 0.9403, "step": 30225 }, { "epoch": 0.91, "learning_rate": 1.0416127884614518e-07, "loss": 1.0981, "step": 30226 }, { "epoch": 0.91, "learning_rate": 1.04091615696785e-07, "loss": 1.2012, "step": 30227 }, { "epoch": 0.91, "learning_rate": 1.0402197535531872e-07, "loss": 1.0907, "step": 30228 }, { "epoch": 0.91, "learning_rate": 1.0395235782240914e-07, "loss": 1.0908, "step": 30229 }, { "epoch": 0.91, "learning_rate": 1.0388276309871937e-07, "loss": 1.0824, "step": 30230 }, { "epoch": 0.91, "learning_rate": 1.0381319118491162e-07, "loss": 1.2488, "step": 30231 }, { "epoch": 0.91, "learning_rate": 1.0374364208164817e-07, "loss": 1.0852, "step": 30232 }, { "epoch": 0.91, "learning_rate": 1.0367411578959125e-07, "loss": 1.0557, "step": 30233 }, { "epoch": 0.91, "learning_rate": 1.0360461230940228e-07, "loss": 1.1377, "step": 30234 }, { "epoch": 0.91, "learning_rate": 1.0353513164174406e-07, "loss": 1.0313, "step": 30235 }, { "epoch": 0.91, "learning_rate": 1.0346567378727663e-07, "loss": 1.2109, "step": 30236 }, { "epoch": 0.91, "learning_rate": 1.0339623874666166e-07, "loss": 1.041, "step": 30237 }, { "epoch": 0.91, "learning_rate": 1.0332682652056059e-07, "loss": 1.1484, "step": 30238 }, { "epoch": 0.91, "learning_rate": 1.0325743710963398e-07, "loss": 1.072, "step": 30239 }, { "epoch": 0.91, "learning_rate": 1.0318807051454188e-07, "loss": 1.0203, "step": 30240 }, { "epoch": 0.91, "learning_rate": 1.0311872673594514e-07, "loss": 1.1251, "step": 30241 }, { "epoch": 0.91, "learning_rate": 1.0304940577450351e-07, "loss": 1.1777, "step": 30242 }, { "epoch": 0.91, "learning_rate": 1.0298010763087757e-07, "loss": 1.0991, "step": 30243 }, { "epoch": 0.91, "learning_rate": 1.0291083230572623e-07, "loss": 1.1956, "step": 30244 }, { "epoch": 0.91, "learning_rate": 1.0284157979970954e-07, "loss": 1.131, "step": 30245 }, { "epoch": 0.91, "learning_rate": 1.0277235011348612e-07, "loss": 0.9976, "step": 30246 }, { "epoch": 0.91, "learning_rate": 1.0270314324771574e-07, "loss": 1.0422, "step": 30247 }, { "epoch": 0.91, "learning_rate": 1.0263395920305675e-07, "loss": 1.1157, "step": 30248 }, { "epoch": 0.91, "learning_rate": 1.0256479798016777e-07, "loss": 1.1427, "step": 30249 }, { "epoch": 0.91, "learning_rate": 1.0249565957970747e-07, "loss": 1.0043, "step": 30250 }, { "epoch": 0.91, "learning_rate": 1.0242654400233365e-07, "loss": 1.071, "step": 30251 }, { "epoch": 0.91, "learning_rate": 1.0235745124870439e-07, "loss": 1.1201, "step": 30252 }, { "epoch": 0.91, "learning_rate": 1.022883813194775e-07, "loss": 1.0264, "step": 30253 }, { "epoch": 0.91, "learning_rate": 1.0221933421531022e-07, "loss": 1.0884, "step": 30254 }, { "epoch": 0.91, "learning_rate": 1.0215030993686038e-07, "loss": 1.1501, "step": 30255 }, { "epoch": 0.91, "learning_rate": 1.0208130848478493e-07, "loss": 1.0922, "step": 30256 }, { "epoch": 0.91, "learning_rate": 1.0201232985974002e-07, "loss": 1.0502, "step": 30257 }, { "epoch": 0.91, "learning_rate": 1.0194337406238319e-07, "loss": 1.0939, "step": 30258 }, { "epoch": 0.91, "learning_rate": 1.018744410933703e-07, "loss": 1.076, "step": 30259 }, { "epoch": 0.91, "learning_rate": 1.0180553095335777e-07, "loss": 1.1203, "step": 30260 }, { "epoch": 0.91, "learning_rate": 1.0173664364300202e-07, "loss": 1.1708, "step": 30261 }, { "epoch": 0.91, "learning_rate": 1.0166777916295778e-07, "loss": 1.1263, "step": 30262 }, { "epoch": 0.91, "learning_rate": 1.015989375138815e-07, "loss": 1.1046, "step": 30263 }, { "epoch": 0.91, "learning_rate": 1.0153011869642792e-07, "loss": 1.0416, "step": 30264 }, { "epoch": 0.91, "learning_rate": 1.014613227112532e-07, "loss": 1.0682, "step": 30265 }, { "epoch": 0.91, "learning_rate": 1.0139254955901095e-07, "loss": 1.1908, "step": 30266 }, { "epoch": 0.91, "learning_rate": 1.0132379924035624e-07, "loss": 1.1316, "step": 30267 }, { "epoch": 0.91, "learning_rate": 1.0125507175594406e-07, "loss": 1.194, "step": 30268 }, { "epoch": 0.91, "learning_rate": 1.0118636710642838e-07, "loss": 1.1383, "step": 30269 }, { "epoch": 0.91, "learning_rate": 1.0111768529246307e-07, "loss": 1.0144, "step": 30270 }, { "epoch": 0.91, "learning_rate": 1.0104902631470181e-07, "loss": 0.9127, "step": 30271 }, { "epoch": 0.91, "learning_rate": 1.0098039017379852e-07, "loss": 1.1296, "step": 30272 }, { "epoch": 0.91, "learning_rate": 1.0091177687040681e-07, "loss": 1.1442, "step": 30273 }, { "epoch": 0.91, "learning_rate": 1.0084318640517953e-07, "loss": 1.1926, "step": 30274 }, { "epoch": 0.91, "learning_rate": 1.0077461877876948e-07, "loss": 1.0847, "step": 30275 }, { "epoch": 0.91, "learning_rate": 1.0070607399182947e-07, "loss": 1.1053, "step": 30276 }, { "epoch": 0.91, "learning_rate": 1.0063755204501203e-07, "loss": 1.113, "step": 30277 }, { "epoch": 0.91, "learning_rate": 1.0056905293896967e-07, "loss": 1.0003, "step": 30278 }, { "epoch": 0.91, "learning_rate": 1.0050057667435414e-07, "loss": 1.1357, "step": 30279 }, { "epoch": 0.91, "learning_rate": 1.0043212325181767e-07, "loss": 1.2367, "step": 30280 }, { "epoch": 0.91, "learning_rate": 1.0036369267201169e-07, "loss": 1.1922, "step": 30281 }, { "epoch": 0.91, "learning_rate": 1.0029528493558788e-07, "loss": 1.1457, "step": 30282 }, { "epoch": 0.91, "learning_rate": 1.0022690004319685e-07, "loss": 1.1838, "step": 30283 }, { "epoch": 0.91, "learning_rate": 1.001585379954903e-07, "loss": 1.0746, "step": 30284 }, { "epoch": 0.91, "learning_rate": 1.0009019879311826e-07, "loss": 1.0298, "step": 30285 }, { "epoch": 0.91, "learning_rate": 1.0002188243673188e-07, "loss": 1.0428, "step": 30286 }, { "epoch": 0.91, "learning_rate": 9.995358892698149e-08, "loss": 1.2178, "step": 30287 }, { "epoch": 0.91, "learning_rate": 9.988531826451681e-08, "loss": 1.0825, "step": 30288 }, { "epoch": 0.91, "learning_rate": 9.981707044998817e-08, "loss": 1.1985, "step": 30289 }, { "epoch": 0.91, "learning_rate": 9.974884548404478e-08, "loss": 1.1217, "step": 30290 }, { "epoch": 0.91, "learning_rate": 9.968064336733669e-08, "loss": 1.1909, "step": 30291 }, { "epoch": 0.91, "learning_rate": 9.961246410051279e-08, "loss": 1.2288, "step": 30292 }, { "epoch": 0.91, "learning_rate": 9.954430768422201e-08, "loss": 1.2471, "step": 30293 }, { "epoch": 0.91, "learning_rate": 9.947617411911331e-08, "loss": 1.0167, "step": 30294 }, { "epoch": 0.91, "learning_rate": 9.940806340583559e-08, "loss": 1.1023, "step": 30295 }, { "epoch": 0.91, "learning_rate": 9.933997554503665e-08, "loss": 1.0363, "step": 30296 }, { "epoch": 0.91, "learning_rate": 9.92719105373649e-08, "loss": 1.0713, "step": 30297 }, { "epoch": 0.91, "learning_rate": 9.92038683834684e-08, "loss": 1.1255, "step": 30298 }, { "epoch": 0.91, "learning_rate": 9.91358490839947e-08, "loss": 1.1127, "step": 30299 }, { "epoch": 0.91, "learning_rate": 9.90678526395919e-08, "loss": 1.1151, "step": 30300 }, { "epoch": 0.91, "learning_rate": 9.899987905090641e-08, "loss": 1.1649, "step": 30301 }, { "epoch": 0.91, "learning_rate": 9.893192831858577e-08, "loss": 1.134, "step": 30302 }, { "epoch": 0.91, "learning_rate": 9.886400044327671e-08, "loss": 1.0986, "step": 30303 }, { "epoch": 0.91, "learning_rate": 9.879609542562618e-08, "loss": 1.1624, "step": 30304 }, { "epoch": 0.91, "learning_rate": 9.872821326628007e-08, "loss": 1.2322, "step": 30305 }, { "epoch": 0.91, "learning_rate": 9.866035396588508e-08, "loss": 1.1051, "step": 30306 }, { "epoch": 0.91, "learning_rate": 9.859251752508681e-08, "loss": 1.0684, "step": 30307 }, { "epoch": 0.91, "learning_rate": 9.852470394453112e-08, "loss": 1.2218, "step": 30308 }, { "epoch": 0.91, "learning_rate": 9.84569132248639e-08, "loss": 1.1389, "step": 30309 }, { "epoch": 0.91, "learning_rate": 9.838914536673016e-08, "loss": 1.1479, "step": 30310 }, { "epoch": 0.91, "learning_rate": 9.832140037077498e-08, "loss": 1.2616, "step": 30311 }, { "epoch": 0.91, "learning_rate": 9.825367823764364e-08, "loss": 1.0634, "step": 30312 }, { "epoch": 0.91, "learning_rate": 9.818597896798065e-08, "loss": 1.1763, "step": 30313 }, { "epoch": 0.91, "learning_rate": 9.811830256243021e-08, "loss": 1.0643, "step": 30314 }, { "epoch": 0.91, "learning_rate": 9.805064902163652e-08, "loss": 1.0906, "step": 30315 }, { "epoch": 0.91, "learning_rate": 9.798301834624408e-08, "loss": 1.0898, "step": 30316 }, { "epoch": 0.91, "learning_rate": 9.791541053689679e-08, "loss": 1.171, "step": 30317 }, { "epoch": 0.91, "learning_rate": 9.78478255942375e-08, "loss": 1.002, "step": 30318 }, { "epoch": 0.91, "learning_rate": 9.778026351890985e-08, "loss": 1.1608, "step": 30319 }, { "epoch": 0.91, "learning_rate": 9.771272431155721e-08, "loss": 1.0861, "step": 30320 }, { "epoch": 0.91, "learning_rate": 9.764520797282295e-08, "loss": 1.0458, "step": 30321 }, { "epoch": 0.91, "learning_rate": 9.75777145033488e-08, "loss": 1.048, "step": 30322 }, { "epoch": 0.91, "learning_rate": 9.751024390377784e-08, "loss": 1.0442, "step": 30323 }, { "epoch": 0.91, "learning_rate": 9.744279617475233e-08, "loss": 1.186, "step": 30324 }, { "epoch": 0.91, "learning_rate": 9.737537131691427e-08, "loss": 0.986, "step": 30325 }, { "epoch": 0.91, "learning_rate": 9.730796933090564e-08, "loss": 1.013, "step": 30326 }, { "epoch": 0.91, "learning_rate": 9.724059021736787e-08, "loss": 1.0962, "step": 30327 }, { "epoch": 0.91, "learning_rate": 9.71732339769424e-08, "loss": 1.0745, "step": 30328 }, { "epoch": 0.91, "learning_rate": 9.710590061027065e-08, "loss": 1.0826, "step": 30329 }, { "epoch": 0.91, "learning_rate": 9.70385901179935e-08, "loss": 1.1052, "step": 30330 }, { "epoch": 0.91, "learning_rate": 9.697130250075154e-08, "loss": 1.2551, "step": 30331 }, { "epoch": 0.91, "learning_rate": 9.69040377591854e-08, "loss": 1.1078, "step": 30332 }, { "epoch": 0.91, "learning_rate": 9.683679589393535e-08, "loss": 1.0211, "step": 30333 }, { "epoch": 0.91, "learning_rate": 9.676957690564176e-08, "loss": 1.0665, "step": 30334 }, { "epoch": 0.91, "learning_rate": 9.670238079494437e-08, "loss": 1.1661, "step": 30335 }, { "epoch": 0.91, "learning_rate": 9.663520756248269e-08, "loss": 1.1434, "step": 30336 }, { "epoch": 0.91, "learning_rate": 9.656805720889645e-08, "loss": 1.122, "step": 30337 }, { "epoch": 0.91, "learning_rate": 9.65009297348246e-08, "loss": 1.0194, "step": 30338 }, { "epoch": 0.91, "learning_rate": 9.643382514090694e-08, "loss": 1.0815, "step": 30339 }, { "epoch": 0.91, "learning_rate": 9.636674342778097e-08, "loss": 1.0017, "step": 30340 }, { "epoch": 0.91, "learning_rate": 9.629968459608619e-08, "loss": 1.1663, "step": 30341 }, { "epoch": 0.91, "learning_rate": 9.623264864646098e-08, "loss": 1.1552, "step": 30342 }, { "epoch": 0.91, "learning_rate": 9.616563557954317e-08, "loss": 1.1179, "step": 30343 }, { "epoch": 0.91, "learning_rate": 9.609864539597058e-08, "loss": 1.2257, "step": 30344 }, { "epoch": 0.91, "learning_rate": 9.60316780963813e-08, "loss": 1.0997, "step": 30345 }, { "epoch": 0.91, "learning_rate": 9.596473368141262e-08, "loss": 0.9774, "step": 30346 }, { "epoch": 0.91, "learning_rate": 9.589781215170207e-08, "loss": 1.0636, "step": 30347 }, { "epoch": 0.91, "learning_rate": 9.583091350788609e-08, "loss": 1.1517, "step": 30348 }, { "epoch": 0.91, "learning_rate": 9.576403775060223e-08, "loss": 1.0599, "step": 30349 }, { "epoch": 0.91, "learning_rate": 9.569718488048662e-08, "loss": 1.0758, "step": 30350 }, { "epoch": 0.91, "learning_rate": 9.563035489817602e-08, "loss": 1.1433, "step": 30351 }, { "epoch": 0.91, "learning_rate": 9.556354780430627e-08, "loss": 1.2188, "step": 30352 }, { "epoch": 0.91, "learning_rate": 9.549676359951355e-08, "loss": 1.0825, "step": 30353 }, { "epoch": 0.91, "learning_rate": 9.543000228443373e-08, "loss": 1.0635, "step": 30354 }, { "epoch": 0.91, "learning_rate": 9.536326385970213e-08, "loss": 1.0839, "step": 30355 }, { "epoch": 0.91, "learning_rate": 9.529654832595437e-08, "loss": 0.9891, "step": 30356 }, { "epoch": 0.91, "learning_rate": 9.522985568382492e-08, "loss": 1.0396, "step": 30357 }, { "epoch": 0.91, "learning_rate": 9.516318593394913e-08, "loss": 1.2145, "step": 30358 }, { "epoch": 0.91, "learning_rate": 9.509653907696176e-08, "loss": 1.017, "step": 30359 }, { "epoch": 0.91, "learning_rate": 9.502991511349702e-08, "loss": 1.0858, "step": 30360 }, { "epoch": 0.91, "learning_rate": 9.496331404418913e-08, "loss": 1.0364, "step": 30361 }, { "epoch": 0.91, "learning_rate": 9.48967358696723e-08, "loss": 1.1296, "step": 30362 }, { "epoch": 0.91, "learning_rate": 9.483018059058018e-08, "loss": 1.1488, "step": 30363 }, { "epoch": 0.91, "learning_rate": 9.476364820754674e-08, "loss": 1.0193, "step": 30364 }, { "epoch": 0.91, "learning_rate": 9.469713872120451e-08, "loss": 0.9943, "step": 30365 }, { "epoch": 0.91, "learning_rate": 9.463065213218714e-08, "loss": 1.0171, "step": 30366 }, { "epoch": 0.91, "learning_rate": 9.456418844112747e-08, "loss": 1.108, "step": 30367 }, { "epoch": 0.91, "learning_rate": 9.449774764865832e-08, "loss": 1.1568, "step": 30368 }, { "epoch": 0.91, "learning_rate": 9.443132975541225e-08, "loss": 1.0705, "step": 30369 }, { "epoch": 0.91, "learning_rate": 9.436493476202124e-08, "loss": 1.0365, "step": 30370 }, { "epoch": 0.91, "learning_rate": 9.42985626691173e-08, "loss": 1.1221, "step": 30371 }, { "epoch": 0.91, "learning_rate": 9.423221347733242e-08, "loss": 0.9843, "step": 30372 }, { "epoch": 0.91, "learning_rate": 9.416588718729858e-08, "loss": 1.1678, "step": 30373 }, { "epoch": 0.92, "learning_rate": 9.409958379964668e-08, "loss": 1.2143, "step": 30374 }, { "epoch": 0.92, "learning_rate": 9.40333033150076e-08, "loss": 1.1132, "step": 30375 }, { "epoch": 0.92, "learning_rate": 9.396704573401305e-08, "loss": 1.0312, "step": 30376 }, { "epoch": 0.92, "learning_rate": 9.390081105729366e-08, "loss": 1.1953, "step": 30377 }, { "epoch": 0.92, "learning_rate": 9.383459928547944e-08, "loss": 0.991, "step": 30378 }, { "epoch": 0.92, "learning_rate": 9.376841041920076e-08, "loss": 1.1502, "step": 30379 }, { "epoch": 0.92, "learning_rate": 9.37022444590882e-08, "loss": 1.0414, "step": 30380 }, { "epoch": 0.92, "learning_rate": 9.363610140577128e-08, "loss": 1.1029, "step": 30381 }, { "epoch": 0.92, "learning_rate": 9.356998125988004e-08, "loss": 1.1242, "step": 30382 }, { "epoch": 0.92, "learning_rate": 9.350388402204341e-08, "loss": 1.1713, "step": 30383 }, { "epoch": 0.92, "learning_rate": 9.343780969289062e-08, "loss": 1.0089, "step": 30384 }, { "epoch": 0.92, "learning_rate": 9.33717582730509e-08, "loss": 1.1522, "step": 30385 }, { "epoch": 0.92, "learning_rate": 9.330572976315344e-08, "loss": 1.0726, "step": 30386 }, { "epoch": 0.92, "learning_rate": 9.323972416382582e-08, "loss": 1.0391, "step": 30387 }, { "epoch": 0.92, "learning_rate": 9.317374147569697e-08, "loss": 1.1496, "step": 30388 }, { "epoch": 0.92, "learning_rate": 9.310778169939472e-08, "loss": 1.0824, "step": 30389 }, { "epoch": 0.92, "learning_rate": 9.304184483554746e-08, "loss": 1.0789, "step": 30390 }, { "epoch": 0.92, "learning_rate": 9.297593088478246e-08, "loss": 1.05, "step": 30391 }, { "epoch": 0.92, "learning_rate": 9.291003984772757e-08, "loss": 1.1237, "step": 30392 }, { "epoch": 0.92, "learning_rate": 9.284417172500948e-08, "loss": 0.985, "step": 30393 }, { "epoch": 0.92, "learning_rate": 9.277832651725577e-08, "loss": 1.0894, "step": 30394 }, { "epoch": 0.92, "learning_rate": 9.271250422509315e-08, "loss": 1.0644, "step": 30395 }, { "epoch": 0.92, "learning_rate": 9.264670484914806e-08, "loss": 1.1415, "step": 30396 }, { "epoch": 0.92, "learning_rate": 9.258092839004667e-08, "loss": 1.0966, "step": 30397 }, { "epoch": 0.92, "learning_rate": 9.251517484841544e-08, "loss": 1.2117, "step": 30398 }, { "epoch": 0.92, "learning_rate": 9.244944422488078e-08, "loss": 1.121, "step": 30399 }, { "epoch": 0.92, "learning_rate": 9.238373652006722e-08, "loss": 1.0259, "step": 30400 }, { "epoch": 0.92, "learning_rate": 9.231805173460117e-08, "loss": 1.0891, "step": 30401 }, { "epoch": 0.92, "learning_rate": 9.225238986910773e-08, "loss": 1.0615, "step": 30402 }, { "epoch": 0.92, "learning_rate": 9.21867509242122e-08, "loss": 1.1944, "step": 30403 }, { "epoch": 0.92, "learning_rate": 9.21211349005388e-08, "loss": 1.0731, "step": 30404 }, { "epoch": 0.92, "learning_rate": 9.205554179871262e-08, "loss": 1.1587, "step": 30405 }, { "epoch": 0.92, "learning_rate": 9.198997161935786e-08, "loss": 1.1902, "step": 30406 }, { "epoch": 0.92, "learning_rate": 9.192442436309872e-08, "loss": 0.9587, "step": 30407 }, { "epoch": 0.92, "learning_rate": 9.185890003055975e-08, "loss": 1.1149, "step": 30408 }, { "epoch": 0.92, "learning_rate": 9.179339862236403e-08, "loss": 1.1191, "step": 30409 }, { "epoch": 0.92, "learning_rate": 9.172792013913523e-08, "loss": 1.166, "step": 30410 }, { "epoch": 0.92, "learning_rate": 9.166246458149674e-08, "loss": 1.1046, "step": 30411 }, { "epoch": 0.92, "learning_rate": 9.159703195007197e-08, "loss": 1.1839, "step": 30412 }, { "epoch": 0.92, "learning_rate": 9.153162224548346e-08, "loss": 0.9775, "step": 30413 }, { "epoch": 0.92, "learning_rate": 9.146623546835376e-08, "loss": 1.0676, "step": 30414 }, { "epoch": 0.92, "learning_rate": 9.140087161930545e-08, "loss": 0.9849, "step": 30415 }, { "epoch": 0.92, "learning_rate": 9.133553069896078e-08, "loss": 1.0186, "step": 30416 }, { "epoch": 0.92, "learning_rate": 9.127021270794206e-08, "loss": 1.0588, "step": 30417 }, { "epoch": 0.92, "learning_rate": 9.120491764687073e-08, "loss": 1.0319, "step": 30418 }, { "epoch": 0.92, "learning_rate": 9.113964551636823e-08, "loss": 0.966, "step": 30419 }, { "epoch": 0.92, "learning_rate": 9.107439631705656e-08, "loss": 1.0743, "step": 30420 }, { "epoch": 0.92, "learning_rate": 9.100917004955634e-08, "loss": 1.0274, "step": 30421 }, { "epoch": 0.92, "learning_rate": 9.094396671448873e-08, "loss": 1.0374, "step": 30422 }, { "epoch": 0.92, "learning_rate": 9.08787863124741e-08, "loss": 1.0643, "step": 30423 }, { "epoch": 0.92, "learning_rate": 9.081362884413303e-08, "loss": 1.2008, "step": 30424 }, { "epoch": 0.92, "learning_rate": 9.074849431008642e-08, "loss": 1.213, "step": 30425 }, { "epoch": 0.92, "learning_rate": 9.06833827109535e-08, "loss": 1.05, "step": 30426 }, { "epoch": 0.92, "learning_rate": 9.061829404735434e-08, "loss": 1.0911, "step": 30427 }, { "epoch": 0.92, "learning_rate": 9.055322831990843e-08, "loss": 1.0226, "step": 30428 }, { "epoch": 0.92, "learning_rate": 9.048818552923583e-08, "loss": 1.2062, "step": 30429 }, { "epoch": 0.92, "learning_rate": 9.042316567595494e-08, "loss": 1.1703, "step": 30430 }, { "epoch": 0.92, "learning_rate": 9.035816876068527e-08, "loss": 1.1321, "step": 30431 }, { "epoch": 0.92, "learning_rate": 9.029319478404492e-08, "loss": 1.1107, "step": 30432 }, { "epoch": 0.92, "learning_rate": 9.022824374665312e-08, "loss": 1.1783, "step": 30433 }, { "epoch": 0.92, "learning_rate": 9.0163315649128e-08, "loss": 1.1313, "step": 30434 }, { "epoch": 0.92, "learning_rate": 9.009841049208712e-08, "loss": 1.0481, "step": 30435 }, { "epoch": 0.92, "learning_rate": 9.003352827614887e-08, "loss": 1.0588, "step": 30436 }, { "epoch": 0.92, "learning_rate": 8.996866900193051e-08, "loss": 1.0737, "step": 30437 }, { "epoch": 0.92, "learning_rate": 8.990383267005021e-08, "loss": 1.2253, "step": 30438 }, { "epoch": 0.92, "learning_rate": 8.983901928112438e-08, "loss": 1.0887, "step": 30439 }, { "epoch": 0.92, "learning_rate": 8.977422883577031e-08, "loss": 1.1049, "step": 30440 }, { "epoch": 0.92, "learning_rate": 8.970946133460473e-08, "loss": 0.9782, "step": 30441 }, { "epoch": 0.92, "learning_rate": 8.964471677824438e-08, "loss": 1.2352, "step": 30442 }, { "epoch": 0.92, "learning_rate": 8.957999516730515e-08, "loss": 1.2133, "step": 30443 }, { "epoch": 0.92, "learning_rate": 8.951529650240376e-08, "loss": 1.0993, "step": 30444 }, { "epoch": 0.92, "learning_rate": 8.945062078415556e-08, "loss": 1.0892, "step": 30445 }, { "epoch": 0.92, "learning_rate": 8.938596801317701e-08, "loss": 1.148, "step": 30446 }, { "epoch": 0.92, "learning_rate": 8.932133819008287e-08, "loss": 1.1074, "step": 30447 }, { "epoch": 0.92, "learning_rate": 8.925673131548823e-08, "loss": 1.0212, "step": 30448 }, { "epoch": 0.92, "learning_rate": 8.91921473900087e-08, "loss": 1.1466, "step": 30449 }, { "epoch": 0.92, "learning_rate": 8.912758641425878e-08, "loss": 1.011, "step": 30450 }, { "epoch": 0.92, "learning_rate": 8.906304838885326e-08, "loss": 1.0765, "step": 30451 }, { "epoch": 0.92, "learning_rate": 8.899853331440639e-08, "loss": 1.0986, "step": 30452 }, { "epoch": 0.92, "learning_rate": 8.893404119153209e-08, "loss": 0.9589, "step": 30453 }, { "epoch": 0.92, "learning_rate": 8.886957202084434e-08, "loss": 1.0779, "step": 30454 }, { "epoch": 0.92, "learning_rate": 8.880512580295764e-08, "loss": 1.1797, "step": 30455 }, { "epoch": 0.92, "learning_rate": 8.874070253848455e-08, "loss": 1.1885, "step": 30456 }, { "epoch": 0.92, "learning_rate": 8.867630222803846e-08, "loss": 1.1421, "step": 30457 }, { "epoch": 0.92, "learning_rate": 8.86119248722328e-08, "loss": 1.1725, "step": 30458 }, { "epoch": 0.92, "learning_rate": 8.854757047168011e-08, "loss": 1.065, "step": 30459 }, { "epoch": 0.92, "learning_rate": 8.848323902699352e-08, "loss": 1.1372, "step": 30460 }, { "epoch": 0.92, "learning_rate": 8.841893053878503e-08, "loss": 1.1373, "step": 30461 }, { "epoch": 0.92, "learning_rate": 8.835464500766638e-08, "loss": 1.1039, "step": 30462 }, { "epoch": 0.92, "learning_rate": 8.829038243425042e-08, "loss": 1.1251, "step": 30463 }, { "epoch": 0.92, "learning_rate": 8.82261428191486e-08, "loss": 1.1587, "step": 30464 }, { "epoch": 0.92, "learning_rate": 8.816192616297209e-08, "loss": 1.1401, "step": 30465 }, { "epoch": 0.92, "learning_rate": 8.809773246633263e-08, "loss": 1.1097, "step": 30466 }, { "epoch": 0.92, "learning_rate": 8.803356172984085e-08, "loss": 1.1063, "step": 30467 }, { "epoch": 0.92, "learning_rate": 8.796941395410846e-08, "loss": 1.0992, "step": 30468 }, { "epoch": 0.92, "learning_rate": 8.7905289139745e-08, "loss": 1.1382, "step": 30469 }, { "epoch": 0.92, "learning_rate": 8.784118728736163e-08, "loss": 1.0737, "step": 30470 }, { "epoch": 0.92, "learning_rate": 8.77771083975687e-08, "loss": 1.0503, "step": 30471 }, { "epoch": 0.92, "learning_rate": 8.771305247097544e-08, "loss": 1.0841, "step": 30472 }, { "epoch": 0.92, "learning_rate": 8.764901950819249e-08, "loss": 1.046, "step": 30473 }, { "epoch": 0.92, "learning_rate": 8.758500950982879e-08, "loss": 1.2051, "step": 30474 }, { "epoch": 0.92, "learning_rate": 8.752102247649413e-08, "loss": 1.0961, "step": 30475 }, { "epoch": 0.92, "learning_rate": 8.745705840879748e-08, "loss": 1.0496, "step": 30476 }, { "epoch": 0.92, "learning_rate": 8.739311730734779e-08, "loss": 1.0963, "step": 30477 }, { "epoch": 0.92, "learning_rate": 8.732919917275373e-08, "loss": 0.9777, "step": 30478 }, { "epoch": 0.92, "learning_rate": 8.726530400562344e-08, "loss": 1.0782, "step": 30479 }, { "epoch": 0.92, "learning_rate": 8.720143180656532e-08, "loss": 1.003, "step": 30480 }, { "epoch": 0.92, "learning_rate": 8.713758257618804e-08, "loss": 1.1273, "step": 30481 }, { "epoch": 0.92, "learning_rate": 8.707375631509863e-08, "loss": 1.0551, "step": 30482 }, { "epoch": 0.92, "learning_rate": 8.700995302390491e-08, "loss": 1.09, "step": 30483 }, { "epoch": 0.92, "learning_rate": 8.694617270321421e-08, "loss": 1.0632, "step": 30484 }, { "epoch": 0.92, "learning_rate": 8.688241535363379e-08, "loss": 1.1705, "step": 30485 }, { "epoch": 0.92, "learning_rate": 8.681868097577095e-08, "loss": 0.956, "step": 30486 }, { "epoch": 0.92, "learning_rate": 8.675496957023161e-08, "loss": 1.2267, "step": 30487 }, { "epoch": 0.92, "learning_rate": 8.669128113762305e-08, "loss": 1.0955, "step": 30488 }, { "epoch": 0.92, "learning_rate": 8.662761567855087e-08, "loss": 1.217, "step": 30489 }, { "epoch": 0.92, "learning_rate": 8.656397319362186e-08, "loss": 1.1616, "step": 30490 }, { "epoch": 0.92, "learning_rate": 8.650035368344106e-08, "loss": 1.04, "step": 30491 }, { "epoch": 0.92, "learning_rate": 8.643675714861466e-08, "loss": 1.1689, "step": 30492 }, { "epoch": 0.92, "learning_rate": 8.6373183589748e-08, "loss": 1.1791, "step": 30493 }, { "epoch": 0.92, "learning_rate": 8.630963300744644e-08, "loss": 1.1668, "step": 30494 }, { "epoch": 0.92, "learning_rate": 8.624610540231421e-08, "loss": 1.0726, "step": 30495 }, { "epoch": 0.92, "learning_rate": 8.618260077495665e-08, "loss": 1.0926, "step": 30496 }, { "epoch": 0.92, "learning_rate": 8.611911912597831e-08, "loss": 1.1602, "step": 30497 }, { "epoch": 0.92, "learning_rate": 8.605566045598312e-08, "loss": 1.1158, "step": 30498 }, { "epoch": 0.92, "learning_rate": 8.599222476557589e-08, "loss": 1.034, "step": 30499 }, { "epoch": 0.92, "learning_rate": 8.592881205535974e-08, "loss": 1.1796, "step": 30500 }, { "epoch": 0.92, "learning_rate": 8.586542232593864e-08, "loss": 1.1564, "step": 30501 }, { "epoch": 0.92, "learning_rate": 8.580205557791599e-08, "loss": 1.1589, "step": 30502 }, { "epoch": 0.92, "learning_rate": 8.573871181189547e-08, "loss": 1.1059, "step": 30503 }, { "epoch": 0.92, "learning_rate": 8.567539102847939e-08, "loss": 1.1472, "step": 30504 }, { "epoch": 0.92, "learning_rate": 8.561209322827086e-08, "loss": 1.157, "step": 30505 }, { "epoch": 0.92, "learning_rate": 8.554881841187217e-08, "loss": 1.0976, "step": 30506 }, { "epoch": 0.92, "learning_rate": 8.548556657988649e-08, "loss": 0.9608, "step": 30507 }, { "epoch": 0.92, "learning_rate": 8.54223377329147e-08, "loss": 1.0883, "step": 30508 }, { "epoch": 0.92, "learning_rate": 8.535913187155964e-08, "loss": 1.0617, "step": 30509 }, { "epoch": 0.92, "learning_rate": 8.529594899642252e-08, "loss": 1.2209, "step": 30510 }, { "epoch": 0.92, "learning_rate": 8.523278910810506e-08, "loss": 1.1141, "step": 30511 }, { "epoch": 0.92, "learning_rate": 8.516965220720902e-08, "loss": 0.9969, "step": 30512 }, { "epoch": 0.92, "learning_rate": 8.510653829433418e-08, "loss": 1.2489, "step": 30513 }, { "epoch": 0.92, "learning_rate": 8.50434473700823e-08, "loss": 1.1693, "step": 30514 }, { "epoch": 0.92, "learning_rate": 8.498037943505344e-08, "loss": 1.1241, "step": 30515 }, { "epoch": 0.92, "learning_rate": 8.491733448984879e-08, "loss": 1.1484, "step": 30516 }, { "epoch": 0.92, "learning_rate": 8.48543125350676e-08, "loss": 1.1508, "step": 30517 }, { "epoch": 0.92, "learning_rate": 8.47913135713102e-08, "loss": 1.1929, "step": 30518 }, { "epoch": 0.92, "learning_rate": 8.472833759917642e-08, "loss": 1.0512, "step": 30519 }, { "epoch": 0.92, "learning_rate": 8.466538461926576e-08, "loss": 1.2024, "step": 30520 }, { "epoch": 0.92, "learning_rate": 8.460245463217692e-08, "loss": 1.0602, "step": 30521 }, { "epoch": 0.92, "learning_rate": 8.453954763850969e-08, "loss": 1.0209, "step": 30522 }, { "epoch": 0.92, "learning_rate": 8.447666363886248e-08, "loss": 0.9625, "step": 30523 }, { "epoch": 0.92, "learning_rate": 8.441380263383425e-08, "loss": 1.2227, "step": 30524 }, { "epoch": 0.92, "learning_rate": 8.435096462402315e-08, "loss": 1.1405, "step": 30525 }, { "epoch": 0.92, "learning_rate": 8.428814961002757e-08, "loss": 1.0876, "step": 30526 }, { "epoch": 0.92, "learning_rate": 8.42253575924451e-08, "loss": 1.1743, "step": 30527 }, { "epoch": 0.92, "learning_rate": 8.416258857187387e-08, "loss": 1.0023, "step": 30528 }, { "epoch": 0.92, "learning_rate": 8.409984254891174e-08, "loss": 1.0104, "step": 30529 }, { "epoch": 0.92, "learning_rate": 8.403711952415489e-08, "loss": 1.1945, "step": 30530 }, { "epoch": 0.92, "learning_rate": 8.397441949820145e-08, "loss": 1.1052, "step": 30531 }, { "epoch": 0.92, "learning_rate": 8.391174247164791e-08, "loss": 1.0769, "step": 30532 }, { "epoch": 0.92, "learning_rate": 8.384908844509099e-08, "loss": 1.2246, "step": 30533 }, { "epoch": 0.92, "learning_rate": 8.378645741912688e-08, "loss": 1.0657, "step": 30534 }, { "epoch": 0.92, "learning_rate": 8.372384939435235e-08, "loss": 1.0405, "step": 30535 }, { "epoch": 0.92, "learning_rate": 8.366126437136274e-08, "loss": 1.2288, "step": 30536 }, { "epoch": 0.92, "learning_rate": 8.359870235075451e-08, "loss": 1.1039, "step": 30537 }, { "epoch": 0.92, "learning_rate": 8.353616333312248e-08, "loss": 1.0627, "step": 30538 }, { "epoch": 0.92, "learning_rate": 8.347364731906226e-08, "loss": 1.007, "step": 30539 }, { "epoch": 0.92, "learning_rate": 8.341115430916952e-08, "loss": 1.0574, "step": 30540 }, { "epoch": 0.92, "learning_rate": 8.33486843040382e-08, "loss": 1.0883, "step": 30541 }, { "epoch": 0.92, "learning_rate": 8.328623730426422e-08, "loss": 1.0951, "step": 30542 }, { "epoch": 0.92, "learning_rate": 8.322381331044071e-08, "loss": 1.1556, "step": 30543 }, { "epoch": 0.92, "learning_rate": 8.316141232316277e-08, "loss": 1.0987, "step": 30544 }, { "epoch": 0.92, "learning_rate": 8.309903434302407e-08, "loss": 1.1225, "step": 30545 }, { "epoch": 0.92, "learning_rate": 8.303667937061887e-08, "loss": 1.0955, "step": 30546 }, { "epoch": 0.92, "learning_rate": 8.29743474065403e-08, "loss": 1.0833, "step": 30547 }, { "epoch": 0.92, "learning_rate": 8.291203845138179e-08, "loss": 1.1027, "step": 30548 }, { "epoch": 0.92, "learning_rate": 8.284975250573646e-08, "loss": 1.1443, "step": 30549 }, { "epoch": 0.92, "learning_rate": 8.278748957019717e-08, "loss": 1.05, "step": 30550 }, { "epoch": 0.92, "learning_rate": 8.272524964535733e-08, "loss": 1.101, "step": 30551 }, { "epoch": 0.92, "learning_rate": 8.26630327318087e-08, "loss": 1.0634, "step": 30552 }, { "epoch": 0.92, "learning_rate": 8.260083883014358e-08, "loss": 1.0057, "step": 30553 }, { "epoch": 0.92, "learning_rate": 8.253866794095456e-08, "loss": 1.0273, "step": 30554 }, { "epoch": 0.92, "learning_rate": 8.247652006483281e-08, "loss": 1.1104, "step": 30555 }, { "epoch": 0.92, "learning_rate": 8.241439520237037e-08, "loss": 1.0883, "step": 30556 }, { "epoch": 0.92, "learning_rate": 8.235229335415845e-08, "loss": 1.0142, "step": 30557 }, { "epoch": 0.92, "learning_rate": 8.229021452078823e-08, "loss": 1.0903, "step": 30558 }, { "epoch": 0.92, "learning_rate": 8.222815870285116e-08, "loss": 1.0501, "step": 30559 }, { "epoch": 0.92, "learning_rate": 8.216612590093737e-08, "loss": 1.0735, "step": 30560 }, { "epoch": 0.92, "learning_rate": 8.210411611563773e-08, "loss": 1.1668, "step": 30561 }, { "epoch": 0.92, "learning_rate": 8.204212934754207e-08, "loss": 1.1851, "step": 30562 }, { "epoch": 0.92, "learning_rate": 8.198016559724132e-08, "loss": 1.0135, "step": 30563 }, { "epoch": 0.92, "learning_rate": 8.191822486532441e-08, "loss": 1.1516, "step": 30564 }, { "epoch": 0.92, "learning_rate": 8.185630715238147e-08, "loss": 1.1046, "step": 30565 }, { "epoch": 0.92, "learning_rate": 8.179441245900199e-08, "loss": 1.1033, "step": 30566 }, { "epoch": 0.92, "learning_rate": 8.173254078577498e-08, "loss": 1.0989, "step": 30567 }, { "epoch": 0.92, "learning_rate": 8.167069213328966e-08, "loss": 1.1301, "step": 30568 }, { "epoch": 0.92, "learning_rate": 8.160886650213445e-08, "loss": 1.201, "step": 30569 }, { "epoch": 0.92, "learning_rate": 8.154706389289807e-08, "loss": 1.0704, "step": 30570 }, { "epoch": 0.92, "learning_rate": 8.148528430616892e-08, "loss": 1.0829, "step": 30571 }, { "epoch": 0.92, "learning_rate": 8.142352774253543e-08, "loss": 1.063, "step": 30572 }, { "epoch": 0.92, "learning_rate": 8.136179420258461e-08, "loss": 0.9626, "step": 30573 }, { "epoch": 0.92, "learning_rate": 8.130008368690489e-08, "loss": 1.1294, "step": 30574 }, { "epoch": 0.92, "learning_rate": 8.123839619608332e-08, "loss": 1.0543, "step": 30575 }, { "epoch": 0.92, "learning_rate": 8.117673173070772e-08, "loss": 1.0355, "step": 30576 }, { "epoch": 0.92, "learning_rate": 8.111509029136433e-08, "loss": 1.0939, "step": 30577 }, { "epoch": 0.92, "learning_rate": 8.105347187864044e-08, "loss": 1.1318, "step": 30578 }, { "epoch": 0.92, "learning_rate": 8.099187649312223e-08, "loss": 1.1124, "step": 30579 }, { "epoch": 0.92, "learning_rate": 8.093030413539648e-08, "loss": 1.1084, "step": 30580 }, { "epoch": 0.92, "learning_rate": 8.086875480604911e-08, "loss": 1.2719, "step": 30581 }, { "epoch": 0.92, "learning_rate": 8.08072285056663e-08, "loss": 1.0742, "step": 30582 }, { "epoch": 0.92, "learning_rate": 8.074572523483342e-08, "loss": 1.0484, "step": 30583 }, { "epoch": 0.92, "learning_rate": 8.068424499413586e-08, "loss": 1.085, "step": 30584 }, { "epoch": 0.92, "learning_rate": 8.062278778415977e-08, "loss": 1.1362, "step": 30585 }, { "epoch": 0.92, "learning_rate": 8.056135360548889e-08, "loss": 1.1782, "step": 30586 }, { "epoch": 0.92, "learning_rate": 8.049994245870884e-08, "loss": 1.1513, "step": 30587 }, { "epoch": 0.92, "learning_rate": 8.043855434440417e-08, "loss": 1.1465, "step": 30588 }, { "epoch": 0.92, "learning_rate": 8.03771892631594e-08, "loss": 1.0614, "step": 30589 }, { "epoch": 0.92, "learning_rate": 8.031584721555796e-08, "loss": 1.0335, "step": 30590 }, { "epoch": 0.92, "learning_rate": 8.025452820218465e-08, "loss": 1.1329, "step": 30591 }, { "epoch": 0.92, "learning_rate": 8.019323222362263e-08, "loss": 1.0732, "step": 30592 }, { "epoch": 0.92, "learning_rate": 8.013195928045559e-08, "loss": 1.1572, "step": 30593 }, { "epoch": 0.92, "learning_rate": 8.007070937326722e-08, "loss": 1.1501, "step": 30594 }, { "epoch": 0.92, "learning_rate": 8.000948250263985e-08, "loss": 1.165, "step": 30595 }, { "epoch": 0.92, "learning_rate": 7.994827866915689e-08, "loss": 1.1085, "step": 30596 }, { "epoch": 0.92, "learning_rate": 7.988709787340066e-08, "loss": 1.1391, "step": 30597 }, { "epoch": 0.92, "learning_rate": 7.982594011595374e-08, "loss": 1.0449, "step": 30598 }, { "epoch": 0.92, "learning_rate": 7.976480539739844e-08, "loss": 1.0677, "step": 30599 }, { "epoch": 0.92, "learning_rate": 7.970369371831627e-08, "loss": 1.1476, "step": 30600 }, { "epoch": 0.92, "learning_rate": 7.964260507928922e-08, "loss": 1.0673, "step": 30601 }, { "epoch": 0.92, "learning_rate": 7.958153948089936e-08, "loss": 1.1002, "step": 30602 }, { "epoch": 0.92, "learning_rate": 7.952049692372732e-08, "loss": 1.0645, "step": 30603 }, { "epoch": 0.92, "learning_rate": 7.945947740835402e-08, "loss": 1.0286, "step": 30604 }, { "epoch": 0.92, "learning_rate": 7.939848093536095e-08, "loss": 1.0975, "step": 30605 }, { "epoch": 0.92, "learning_rate": 7.933750750532876e-08, "loss": 1.0598, "step": 30606 }, { "epoch": 0.92, "learning_rate": 7.927655711883753e-08, "loss": 1.0823, "step": 30607 }, { "epoch": 0.92, "learning_rate": 7.921562977646735e-08, "loss": 1.0822, "step": 30608 }, { "epoch": 0.92, "learning_rate": 7.915472547879888e-08, "loss": 1.0577, "step": 30609 }, { "epoch": 0.92, "learning_rate": 7.909384422641108e-08, "loss": 1.0541, "step": 30610 }, { "epoch": 0.92, "learning_rate": 7.903298601988463e-08, "loss": 1.1808, "step": 30611 }, { "epoch": 0.92, "learning_rate": 7.897215085979764e-08, "loss": 1.1544, "step": 30612 }, { "epoch": 0.92, "learning_rate": 7.891133874672996e-08, "loss": 1.0802, "step": 30613 }, { "epoch": 0.92, "learning_rate": 7.885054968126e-08, "loss": 1.0895, "step": 30614 }, { "epoch": 0.92, "learning_rate": 7.878978366396728e-08, "loss": 1.058, "step": 30615 }, { "epoch": 0.92, "learning_rate": 7.872904069542942e-08, "loss": 1.1178, "step": 30616 }, { "epoch": 0.92, "learning_rate": 7.866832077622483e-08, "loss": 1.1858, "step": 30617 }, { "epoch": 0.92, "learning_rate": 7.860762390693193e-08, "loss": 0.9603, "step": 30618 }, { "epoch": 0.92, "learning_rate": 7.854695008812807e-08, "loss": 1.0609, "step": 30619 }, { "epoch": 0.92, "learning_rate": 7.848629932039137e-08, "loss": 1.0275, "step": 30620 }, { "epoch": 0.92, "learning_rate": 7.842567160429832e-08, "loss": 1.0592, "step": 30621 }, { "epoch": 0.92, "learning_rate": 7.836506694042705e-08, "loss": 1.1694, "step": 30622 }, { "epoch": 0.92, "learning_rate": 7.83044853293538e-08, "loss": 1.1402, "step": 30623 }, { "epoch": 0.92, "learning_rate": 7.824392677165587e-08, "loss": 1.1599, "step": 30624 }, { "epoch": 0.92, "learning_rate": 7.818339126790892e-08, "loss": 1.104, "step": 30625 }, { "epoch": 0.92, "learning_rate": 7.812287881868997e-08, "loss": 1.1316, "step": 30626 }, { "epoch": 0.92, "learning_rate": 7.806238942457467e-08, "loss": 1.012, "step": 30627 }, { "epoch": 0.92, "learning_rate": 7.800192308613924e-08, "loss": 1.0432, "step": 30628 }, { "epoch": 0.92, "learning_rate": 7.794147980395878e-08, "loss": 0.9991, "step": 30629 }, { "epoch": 0.92, "learning_rate": 7.788105957860892e-08, "loss": 1.1276, "step": 30630 }, { "epoch": 0.92, "learning_rate": 7.782066241066477e-08, "loss": 1.0999, "step": 30631 }, { "epoch": 0.92, "learning_rate": 7.776028830070142e-08, "loss": 1.0798, "step": 30632 }, { "epoch": 0.92, "learning_rate": 7.769993724929398e-08, "loss": 1.0998, "step": 30633 }, { "epoch": 0.92, "learning_rate": 7.763960925701613e-08, "loss": 1.1025, "step": 30634 }, { "epoch": 0.92, "learning_rate": 7.757930432444244e-08, "loss": 1.1008, "step": 30635 }, { "epoch": 0.92, "learning_rate": 7.751902245214715e-08, "loss": 1.1185, "step": 30636 }, { "epoch": 0.92, "learning_rate": 7.745876364070399e-08, "loss": 1.1906, "step": 30637 }, { "epoch": 0.92, "learning_rate": 7.739852789068692e-08, "loss": 0.9509, "step": 30638 }, { "epoch": 0.92, "learning_rate": 7.733831520266882e-08, "loss": 1.1423, "step": 30639 }, { "epoch": 0.92, "learning_rate": 7.727812557722314e-08, "loss": 1.0574, "step": 30640 }, { "epoch": 0.92, "learning_rate": 7.72179590149233e-08, "loss": 1.0655, "step": 30641 }, { "epoch": 0.92, "learning_rate": 7.715781551634133e-08, "loss": 1.0873, "step": 30642 }, { "epoch": 0.92, "learning_rate": 7.709769508205012e-08, "loss": 0.9855, "step": 30643 }, { "epoch": 0.92, "learning_rate": 7.703759771262199e-08, "loss": 1.1409, "step": 30644 }, { "epoch": 0.92, "learning_rate": 7.697752340862896e-08, "loss": 1.0752, "step": 30645 }, { "epoch": 0.92, "learning_rate": 7.69174721706431e-08, "loss": 1.1098, "step": 30646 }, { "epoch": 0.92, "learning_rate": 7.685744399923589e-08, "loss": 0.9827, "step": 30647 }, { "epoch": 0.92, "learning_rate": 7.679743889497854e-08, "loss": 1.1846, "step": 30648 }, { "epoch": 0.92, "learning_rate": 7.673745685844253e-08, "loss": 1.122, "step": 30649 }, { "epoch": 0.92, "learning_rate": 7.667749789019907e-08, "loss": 1.029, "step": 30650 }, { "epoch": 0.92, "learning_rate": 7.661756199081855e-08, "loss": 1.0733, "step": 30651 }, { "epoch": 0.92, "learning_rate": 7.655764916087189e-08, "loss": 1.1695, "step": 30652 }, { "epoch": 0.92, "learning_rate": 7.649775940092891e-08, "loss": 1.0843, "step": 30653 }, { "epoch": 0.92, "learning_rate": 7.643789271156054e-08, "loss": 1.0363, "step": 30654 }, { "epoch": 0.92, "learning_rate": 7.63780490933358e-08, "loss": 1.1336, "step": 30655 }, { "epoch": 0.92, "learning_rate": 7.631822854682502e-08, "loss": 1.1376, "step": 30656 }, { "epoch": 0.92, "learning_rate": 7.625843107259723e-08, "loss": 1.0814, "step": 30657 }, { "epoch": 0.92, "learning_rate": 7.619865667122167e-08, "loss": 1.1558, "step": 30658 }, { "epoch": 0.92, "learning_rate": 7.613890534326818e-08, "loss": 1.0652, "step": 30659 }, { "epoch": 0.92, "learning_rate": 7.607917708930435e-08, "loss": 1.0194, "step": 30660 }, { "epoch": 0.92, "learning_rate": 7.601947190989972e-08, "loss": 1.0654, "step": 30661 }, { "epoch": 0.92, "learning_rate": 7.59597898056219e-08, "loss": 1.0372, "step": 30662 }, { "epoch": 0.92, "learning_rate": 7.590013077703962e-08, "loss": 1.1396, "step": 30663 }, { "epoch": 0.92, "learning_rate": 7.584049482472072e-08, "loss": 1.0148, "step": 30664 }, { "epoch": 0.92, "learning_rate": 7.578088194923256e-08, "loss": 1.0956, "step": 30665 }, { "epoch": 0.92, "learning_rate": 7.572129215114299e-08, "loss": 1.1593, "step": 30666 }, { "epoch": 0.92, "learning_rate": 7.566172543101935e-08, "loss": 1.1046, "step": 30667 }, { "epoch": 0.92, "learning_rate": 7.56021817894284e-08, "loss": 1.1355, "step": 30668 }, { "epoch": 0.92, "learning_rate": 7.554266122693693e-08, "loss": 1.1516, "step": 30669 }, { "epoch": 0.92, "learning_rate": 7.548316374411169e-08, "loss": 1.1938, "step": 30670 }, { "epoch": 0.92, "learning_rate": 7.542368934151889e-08, "loss": 1.0941, "step": 30671 }, { "epoch": 0.92, "learning_rate": 7.536423801972531e-08, "loss": 1.0675, "step": 30672 }, { "epoch": 0.92, "learning_rate": 7.530480977929605e-08, "loss": 1.1665, "step": 30673 }, { "epoch": 0.92, "learning_rate": 7.524540462079732e-08, "loss": 1.1281, "step": 30674 }, { "epoch": 0.92, "learning_rate": 7.518602254479451e-08, "loss": 1.1456, "step": 30675 }, { "epoch": 0.92, "learning_rate": 7.512666355185299e-08, "loss": 1.0975, "step": 30676 }, { "epoch": 0.92, "learning_rate": 7.506732764253787e-08, "loss": 1.0509, "step": 30677 }, { "epoch": 0.92, "learning_rate": 7.50080148174137e-08, "loss": 1.0517, "step": 30678 }, { "epoch": 0.92, "learning_rate": 7.494872507704531e-08, "loss": 1.1227, "step": 30679 }, { "epoch": 0.92, "learning_rate": 7.488945842199752e-08, "loss": 1.0679, "step": 30680 }, { "epoch": 0.92, "learning_rate": 7.483021485283376e-08, "loss": 1.1375, "step": 30681 }, { "epoch": 0.92, "learning_rate": 7.47709943701183e-08, "loss": 1.1508, "step": 30682 }, { "epoch": 0.92, "learning_rate": 7.471179697441489e-08, "loss": 1.1603, "step": 30683 }, { "epoch": 0.92, "learning_rate": 7.46526226662872e-08, "loss": 1.0898, "step": 30684 }, { "epoch": 0.92, "learning_rate": 7.45934714462987e-08, "loss": 1.1282, "step": 30685 }, { "epoch": 0.92, "learning_rate": 7.453434331501197e-08, "loss": 1.022, "step": 30686 }, { "epoch": 0.92, "learning_rate": 7.44752382729902e-08, "loss": 1.2087, "step": 30687 }, { "epoch": 0.92, "learning_rate": 7.441615632079596e-08, "loss": 1.0925, "step": 30688 }, { "epoch": 0.92, "learning_rate": 7.43570974589916e-08, "loss": 1.1952, "step": 30689 }, { "epoch": 0.92, "learning_rate": 7.429806168813975e-08, "loss": 1.1181, "step": 30690 }, { "epoch": 0.92, "learning_rate": 7.423904900880185e-08, "loss": 1.0826, "step": 30691 }, { "epoch": 0.92, "learning_rate": 7.418005942154e-08, "loss": 1.1595, "step": 30692 }, { "epoch": 0.92, "learning_rate": 7.412109292691567e-08, "loss": 1.138, "step": 30693 }, { "epoch": 0.92, "learning_rate": 7.406214952549035e-08, "loss": 1.0889, "step": 30694 }, { "epoch": 0.92, "learning_rate": 7.400322921782471e-08, "loss": 1.1063, "step": 30695 }, { "epoch": 0.92, "learning_rate": 7.394433200447997e-08, "loss": 1.0376, "step": 30696 }, { "epoch": 0.92, "learning_rate": 7.388545788601681e-08, "loss": 0.9965, "step": 30697 }, { "epoch": 0.92, "learning_rate": 7.382660686299587e-08, "loss": 1.1772, "step": 30698 }, { "epoch": 0.92, "learning_rate": 7.376777893597697e-08, "loss": 1.0776, "step": 30699 }, { "epoch": 0.92, "learning_rate": 7.370897410552025e-08, "loss": 1.0886, "step": 30700 }, { "epoch": 0.92, "learning_rate": 7.365019237218552e-08, "loss": 1.163, "step": 30701 }, { "epoch": 0.92, "learning_rate": 7.35914337365326e-08, "loss": 1.0336, "step": 30702 }, { "epoch": 0.92, "learning_rate": 7.353269819912051e-08, "loss": 1.1246, "step": 30703 }, { "epoch": 0.92, "learning_rate": 7.347398576050852e-08, "loss": 1.1182, "step": 30704 }, { "epoch": 0.92, "learning_rate": 7.341529642125533e-08, "loss": 1.1709, "step": 30705 }, { "epoch": 0.93, "learning_rate": 7.335663018192024e-08, "loss": 1.21, "step": 30706 }, { "epoch": 0.93, "learning_rate": 7.329798704306112e-08, "loss": 1.075, "step": 30707 }, { "epoch": 0.93, "learning_rate": 7.323936700523615e-08, "loss": 1.06, "step": 30708 }, { "epoch": 0.93, "learning_rate": 7.318077006900404e-08, "loss": 1.1212, "step": 30709 }, { "epoch": 0.93, "learning_rate": 7.312219623492184e-08, "loss": 1.0229, "step": 30710 }, { "epoch": 0.93, "learning_rate": 7.306364550354799e-08, "loss": 1.0942, "step": 30711 }, { "epoch": 0.93, "learning_rate": 7.300511787543902e-08, "loss": 1.0807, "step": 30712 }, { "epoch": 0.93, "learning_rate": 7.29466133511525e-08, "loss": 1.1318, "step": 30713 }, { "epoch": 0.93, "learning_rate": 7.288813193124522e-08, "loss": 1.1026, "step": 30714 }, { "epoch": 0.93, "learning_rate": 7.282967361627424e-08, "loss": 1.1161, "step": 30715 }, { "epoch": 0.93, "learning_rate": 7.277123840679579e-08, "loss": 1.0812, "step": 30716 }, { "epoch": 0.93, "learning_rate": 7.271282630336579e-08, "loss": 1.1769, "step": 30717 }, { "epoch": 0.93, "learning_rate": 7.265443730654103e-08, "loss": 1.2069, "step": 30718 }, { "epoch": 0.93, "learning_rate": 7.259607141687664e-08, "loss": 1.1172, "step": 30719 }, { "epoch": 0.93, "learning_rate": 7.253772863492881e-08, "loss": 1.111, "step": 30720 }, { "epoch": 0.93, "learning_rate": 7.247940896125266e-08, "loss": 1.1535, "step": 30721 }, { "epoch": 0.93, "learning_rate": 7.242111239640331e-08, "loss": 1.1101, "step": 30722 }, { "epoch": 0.93, "learning_rate": 7.236283894093615e-08, "loss": 1.1687, "step": 30723 }, { "epoch": 0.93, "learning_rate": 7.230458859540517e-08, "loss": 0.971, "step": 30724 }, { "epoch": 0.93, "learning_rate": 7.22463613603655e-08, "loss": 1.0965, "step": 30725 }, { "epoch": 0.93, "learning_rate": 7.218815723637112e-08, "loss": 1.0715, "step": 30726 }, { "epoch": 0.93, "learning_rate": 7.212997622397633e-08, "loss": 1.0887, "step": 30727 }, { "epoch": 0.93, "learning_rate": 7.207181832373483e-08, "loss": 1.0558, "step": 30728 }, { "epoch": 0.93, "learning_rate": 7.201368353620036e-08, "loss": 1.0311, "step": 30729 }, { "epoch": 0.93, "learning_rate": 7.19555718619261e-08, "loss": 1.1321, "step": 30730 }, { "epoch": 0.93, "learning_rate": 7.189748330146545e-08, "loss": 1.0734, "step": 30731 }, { "epoch": 0.93, "learning_rate": 7.183941785537163e-08, "loss": 0.9744, "step": 30732 }, { "epoch": 0.93, "learning_rate": 7.178137552419667e-08, "loss": 1.0937, "step": 30733 }, { "epoch": 0.93, "learning_rate": 7.172335630849375e-08, "loss": 1.1313, "step": 30734 }, { "epoch": 0.93, "learning_rate": 7.166536020881493e-08, "loss": 1.1775, "step": 30735 }, { "epoch": 0.93, "learning_rate": 7.160738722571254e-08, "loss": 1.238, "step": 30736 }, { "epoch": 0.93, "learning_rate": 7.154943735973807e-08, "loss": 1.0865, "step": 30737 }, { "epoch": 0.93, "learning_rate": 7.149151061144333e-08, "loss": 1.1992, "step": 30738 }, { "epoch": 0.93, "learning_rate": 7.14336069813798e-08, "loss": 1.1265, "step": 30739 }, { "epoch": 0.93, "learning_rate": 7.137572647009872e-08, "loss": 1.0411, "step": 30740 }, { "epoch": 0.93, "learning_rate": 7.13178690781513e-08, "loss": 1.136, "step": 30741 }, { "epoch": 0.93, "learning_rate": 7.126003480608795e-08, "loss": 1.0416, "step": 30742 }, { "epoch": 0.93, "learning_rate": 7.120222365445906e-08, "loss": 1.1703, "step": 30743 }, { "epoch": 0.93, "learning_rate": 7.114443562381557e-08, "loss": 1.0835, "step": 30744 }, { "epoch": 0.93, "learning_rate": 7.108667071470704e-08, "loss": 1.0715, "step": 30745 }, { "epoch": 0.93, "learning_rate": 7.10289289276836e-08, "loss": 1.0442, "step": 30746 }, { "epoch": 0.93, "learning_rate": 7.097121026329507e-08, "loss": 1.0239, "step": 30747 }, { "epoch": 0.93, "learning_rate": 7.091351472209074e-08, "loss": 1.0775, "step": 30748 }, { "epoch": 0.93, "learning_rate": 7.085584230462017e-08, "loss": 1.0516, "step": 30749 }, { "epoch": 0.93, "learning_rate": 7.079819301143154e-08, "loss": 1.1494, "step": 30750 }, { "epoch": 0.93, "learning_rate": 7.07405668430744e-08, "loss": 1.0337, "step": 30751 }, { "epoch": 0.93, "learning_rate": 7.068296380009721e-08, "loss": 1.1262, "step": 30752 }, { "epoch": 0.93, "learning_rate": 7.062538388304785e-08, "loss": 1.0052, "step": 30753 }, { "epoch": 0.93, "learning_rate": 7.056782709247533e-08, "loss": 1.1575, "step": 30754 }, { "epoch": 0.93, "learning_rate": 7.051029342892673e-08, "loss": 1.1248, "step": 30755 }, { "epoch": 0.93, "learning_rate": 7.045278289294993e-08, "loss": 1.1708, "step": 30756 }, { "epoch": 0.93, "learning_rate": 7.039529548509283e-08, "loss": 1.1108, "step": 30757 }, { "epoch": 0.93, "learning_rate": 7.033783120590221e-08, "loss": 1.1567, "step": 30758 }, { "epoch": 0.93, "learning_rate": 7.02803900559254e-08, "loss": 1.198, "step": 30759 }, { "epoch": 0.93, "learning_rate": 7.022297203570893e-08, "loss": 1.0408, "step": 30760 }, { "epoch": 0.93, "learning_rate": 7.016557714579958e-08, "loss": 1.2306, "step": 30761 }, { "epoch": 0.93, "learning_rate": 7.010820538674385e-08, "loss": 1.1153, "step": 30762 }, { "epoch": 0.93, "learning_rate": 7.00508567590874e-08, "loss": 1.062, "step": 30763 }, { "epoch": 0.93, "learning_rate": 6.999353126337677e-08, "loss": 1.0692, "step": 30764 }, { "epoch": 0.93, "learning_rate": 6.993622890015706e-08, "loss": 1.0834, "step": 30765 }, { "epoch": 0.93, "learning_rate": 6.987894966997422e-08, "loss": 1.04, "step": 30766 }, { "epoch": 0.93, "learning_rate": 6.982169357337393e-08, "loss": 1.1181, "step": 30767 }, { "epoch": 0.93, "learning_rate": 6.97644606109002e-08, "loss": 1.1124, "step": 30768 }, { "epoch": 0.93, "learning_rate": 6.970725078309814e-08, "loss": 1.0764, "step": 30769 }, { "epoch": 0.93, "learning_rate": 6.96500640905129e-08, "loss": 1.0857, "step": 30770 }, { "epoch": 0.93, "learning_rate": 6.959290053368845e-08, "loss": 1.059, "step": 30771 }, { "epoch": 0.93, "learning_rate": 6.953576011316909e-08, "loss": 1.1082, "step": 30772 }, { "epoch": 0.93, "learning_rate": 6.947864282949884e-08, "loss": 1.1439, "step": 30773 }, { "epoch": 0.93, "learning_rate": 6.942154868322116e-08, "loss": 1.1569, "step": 30774 }, { "epoch": 0.93, "learning_rate": 6.936447767488002e-08, "loss": 1.0706, "step": 30775 }, { "epoch": 0.93, "learning_rate": 6.930742980501836e-08, "loss": 1.0485, "step": 30776 }, { "epoch": 0.93, "learning_rate": 6.925040507417907e-08, "loss": 1.0971, "step": 30777 }, { "epoch": 0.93, "learning_rate": 6.919340348290532e-08, "loss": 1.0084, "step": 30778 }, { "epoch": 0.93, "learning_rate": 6.913642503173945e-08, "loss": 1.1305, "step": 30779 }, { "epoch": 0.93, "learning_rate": 6.907946972122464e-08, "loss": 1.0756, "step": 30780 }, { "epoch": 0.93, "learning_rate": 6.902253755190214e-08, "loss": 1.1714, "step": 30781 }, { "epoch": 0.93, "learning_rate": 6.896562852431427e-08, "loss": 1.1064, "step": 30782 }, { "epoch": 0.93, "learning_rate": 6.890874263900282e-08, "loss": 1.0712, "step": 30783 }, { "epoch": 0.93, "learning_rate": 6.88518798965096e-08, "loss": 1.0967, "step": 30784 }, { "epoch": 0.93, "learning_rate": 6.879504029737499e-08, "loss": 1.1074, "step": 30785 }, { "epoch": 0.93, "learning_rate": 6.873822384214107e-08, "loss": 1.0457, "step": 30786 }, { "epoch": 0.93, "learning_rate": 6.868143053134823e-08, "loss": 1.0732, "step": 30787 }, { "epoch": 0.93, "learning_rate": 6.862466036553744e-08, "loss": 1.1296, "step": 30788 }, { "epoch": 0.93, "learning_rate": 6.856791334524854e-08, "loss": 0.9824, "step": 30789 }, { "epoch": 0.93, "learning_rate": 6.85111894710222e-08, "loss": 1.0837, "step": 30790 }, { "epoch": 0.93, "learning_rate": 6.845448874339828e-08, "loss": 1.1108, "step": 30791 }, { "epoch": 0.93, "learning_rate": 6.83978111629166e-08, "loss": 1.1322, "step": 30792 }, { "epoch": 0.93, "learning_rate": 6.834115673011676e-08, "loss": 1.0284, "step": 30793 }, { "epoch": 0.93, "learning_rate": 6.828452544553804e-08, "loss": 1.1453, "step": 30794 }, { "epoch": 0.93, "learning_rate": 6.822791730971917e-08, "loss": 1.0989, "step": 30795 }, { "epoch": 0.93, "learning_rate": 6.817133232319945e-08, "loss": 1.0936, "step": 30796 }, { "epoch": 0.93, "learning_rate": 6.811477048651733e-08, "loss": 1.0264, "step": 30797 }, { "epoch": 0.93, "learning_rate": 6.805823180021182e-08, "loss": 1.055, "step": 30798 }, { "epoch": 0.93, "learning_rate": 6.800171626482028e-08, "loss": 1.0484, "step": 30799 }, { "epoch": 0.93, "learning_rate": 6.794522388088116e-08, "loss": 1.1406, "step": 30800 }, { "epoch": 0.93, "learning_rate": 6.788875464893235e-08, "loss": 1.0436, "step": 30801 }, { "epoch": 0.93, "learning_rate": 6.783230856951095e-08, "loss": 1.1438, "step": 30802 }, { "epoch": 0.93, "learning_rate": 6.777588564315485e-08, "loss": 0.9891, "step": 30803 }, { "epoch": 0.93, "learning_rate": 6.771948587040084e-08, "loss": 1.1594, "step": 30804 }, { "epoch": 0.93, "learning_rate": 6.76631092517857e-08, "loss": 1.2147, "step": 30805 }, { "epoch": 0.93, "learning_rate": 6.760675578784681e-08, "loss": 1.1118, "step": 30806 }, { "epoch": 0.93, "learning_rate": 6.755042547911983e-08, "loss": 1.0166, "step": 30807 }, { "epoch": 0.93, "learning_rate": 6.749411832614127e-08, "loss": 1.1112, "step": 30808 }, { "epoch": 0.93, "learning_rate": 6.743783432944712e-08, "loss": 1.0369, "step": 30809 }, { "epoch": 0.93, "learning_rate": 6.738157348957358e-08, "loss": 1.0752, "step": 30810 }, { "epoch": 0.93, "learning_rate": 6.732533580705552e-08, "loss": 1.1857, "step": 30811 }, { "epoch": 0.93, "learning_rate": 6.726912128242862e-08, "loss": 1.1941, "step": 30812 }, { "epoch": 0.93, "learning_rate": 6.721292991622802e-08, "loss": 1.0972, "step": 30813 }, { "epoch": 0.93, "learning_rate": 6.71567617089891e-08, "loss": 1.1719, "step": 30814 }, { "epoch": 0.93, "learning_rate": 6.710061666124562e-08, "loss": 1.0741, "step": 30815 }, { "epoch": 0.93, "learning_rate": 6.70444947735327e-08, "loss": 0.9015, "step": 30816 }, { "epoch": 0.93, "learning_rate": 6.698839604638436e-08, "loss": 1.1161, "step": 30817 }, { "epoch": 0.93, "learning_rate": 6.693232048033488e-08, "loss": 1.0814, "step": 30818 }, { "epoch": 0.93, "learning_rate": 6.687626807591802e-08, "loss": 0.9781, "step": 30819 }, { "epoch": 0.93, "learning_rate": 6.682023883366695e-08, "loss": 1.1339, "step": 30820 }, { "epoch": 0.93, "learning_rate": 6.676423275411543e-08, "loss": 1.1399, "step": 30821 }, { "epoch": 0.93, "learning_rate": 6.670824983779634e-08, "loss": 1.2057, "step": 30822 }, { "epoch": 0.93, "learning_rate": 6.665229008524344e-08, "loss": 1.1254, "step": 30823 }, { "epoch": 0.93, "learning_rate": 6.659635349698824e-08, "loss": 1.1173, "step": 30824 }, { "epoch": 0.93, "learning_rate": 6.654044007356392e-08, "loss": 1.2308, "step": 30825 }, { "epoch": 0.93, "learning_rate": 6.648454981550256e-08, "loss": 1.0899, "step": 30826 }, { "epoch": 0.93, "learning_rate": 6.642868272333624e-08, "loss": 1.111, "step": 30827 }, { "epoch": 0.93, "learning_rate": 6.637283879759676e-08, "loss": 1.1253, "step": 30828 }, { "epoch": 0.93, "learning_rate": 6.63170180388159e-08, "loss": 1.1411, "step": 30829 }, { "epoch": 0.93, "learning_rate": 6.626122044752493e-08, "loss": 1.1605, "step": 30830 }, { "epoch": 0.93, "learning_rate": 6.620544602425505e-08, "loss": 1.1309, "step": 30831 }, { "epoch": 0.93, "learning_rate": 6.614969476953725e-08, "loss": 1.0281, "step": 30832 }, { "epoch": 0.93, "learning_rate": 6.609396668390195e-08, "loss": 1.055, "step": 30833 }, { "epoch": 0.93, "learning_rate": 6.603826176788008e-08, "loss": 1.0139, "step": 30834 }, { "epoch": 0.93, "learning_rate": 6.598258002200154e-08, "loss": 0.9702, "step": 30835 }, { "epoch": 0.93, "learning_rate": 6.59269214467967e-08, "loss": 1.1152, "step": 30836 }, { "epoch": 0.93, "learning_rate": 6.587128604279541e-08, "loss": 1.2303, "step": 30837 }, { "epoch": 0.93, "learning_rate": 6.581567381052673e-08, "loss": 1.077, "step": 30838 }, { "epoch": 0.93, "learning_rate": 6.576008475052076e-08, "loss": 1.0427, "step": 30839 }, { "epoch": 0.93, "learning_rate": 6.570451886330681e-08, "loss": 0.9981, "step": 30840 }, { "epoch": 0.93, "learning_rate": 6.564897614941279e-08, "loss": 0.9983, "step": 30841 }, { "epoch": 0.93, "learning_rate": 6.559345660936828e-08, "loss": 1.2135, "step": 30842 }, { "epoch": 0.93, "learning_rate": 6.553796024370174e-08, "loss": 1.1733, "step": 30843 }, { "epoch": 0.93, "learning_rate": 6.548248705294108e-08, "loss": 1.1406, "step": 30844 }, { "epoch": 0.93, "learning_rate": 6.542703703761505e-08, "loss": 0.9605, "step": 30845 }, { "epoch": 0.93, "learning_rate": 6.5371610198251e-08, "loss": 0.9961, "step": 30846 }, { "epoch": 0.93, "learning_rate": 6.531620653537656e-08, "loss": 1.1332, "step": 30847 }, { "epoch": 0.93, "learning_rate": 6.526082604951912e-08, "loss": 1.0925, "step": 30848 }, { "epoch": 0.93, "learning_rate": 6.520546874120626e-08, "loss": 1.1119, "step": 30849 }, { "epoch": 0.93, "learning_rate": 6.515013461096453e-08, "loss": 1.0815, "step": 30850 }, { "epoch": 0.93, "learning_rate": 6.509482365932074e-08, "loss": 1.0805, "step": 30851 }, { "epoch": 0.93, "learning_rate": 6.503953588680167e-08, "loss": 1.0201, "step": 30852 }, { "epoch": 0.93, "learning_rate": 6.498427129393359e-08, "loss": 1.0916, "step": 30853 }, { "epoch": 0.93, "learning_rate": 6.492902988124245e-08, "loss": 1.1446, "step": 30854 }, { "epoch": 0.93, "learning_rate": 6.487381164925394e-08, "loss": 1.1567, "step": 30855 }, { "epoch": 0.93, "learning_rate": 6.48186165984943e-08, "loss": 1.0458, "step": 30856 }, { "epoch": 0.93, "learning_rate": 6.476344472948842e-08, "loss": 0.9964, "step": 30857 }, { "epoch": 0.93, "learning_rate": 6.470829604276197e-08, "loss": 1.0895, "step": 30858 }, { "epoch": 0.93, "learning_rate": 6.465317053883924e-08, "loss": 1.1189, "step": 30859 }, { "epoch": 0.93, "learning_rate": 6.459806821824565e-08, "loss": 1.0782, "step": 30860 }, { "epoch": 0.93, "learning_rate": 6.454298908150553e-08, "loss": 1.1669, "step": 30861 }, { "epoch": 0.93, "learning_rate": 6.448793312914314e-08, "loss": 1.1698, "step": 30862 }, { "epoch": 0.93, "learning_rate": 6.443290036168282e-08, "loss": 1.1201, "step": 30863 }, { "epoch": 0.93, "learning_rate": 6.437789077964802e-08, "loss": 1.1348, "step": 30864 }, { "epoch": 0.93, "learning_rate": 6.432290438356276e-08, "loss": 1.0842, "step": 30865 }, { "epoch": 0.93, "learning_rate": 6.426794117395053e-08, "loss": 1.0463, "step": 30866 }, { "epoch": 0.93, "learning_rate": 6.421300115133423e-08, "loss": 1.1008, "step": 30867 }, { "epoch": 0.93, "learning_rate": 6.415808431623705e-08, "loss": 1.1053, "step": 30868 }, { "epoch": 0.93, "learning_rate": 6.410319066918164e-08, "loss": 1.1152, "step": 30869 }, { "epoch": 0.93, "learning_rate": 6.404832021069091e-08, "loss": 1.043, "step": 30870 }, { "epoch": 0.93, "learning_rate": 6.399347294128721e-08, "loss": 1.0164, "step": 30871 }, { "epoch": 0.93, "learning_rate": 6.393864886149209e-08, "loss": 0.9865, "step": 30872 }, { "epoch": 0.93, "learning_rate": 6.388384797182761e-08, "loss": 1.0197, "step": 30873 }, { "epoch": 0.93, "learning_rate": 6.382907027281588e-08, "loss": 1.1812, "step": 30874 }, { "epoch": 0.93, "learning_rate": 6.37743157649784e-08, "loss": 1.0669, "step": 30875 }, { "epoch": 0.93, "learning_rate": 6.371958444883558e-08, "loss": 1.1008, "step": 30876 }, { "epoch": 0.93, "learning_rate": 6.366487632490925e-08, "loss": 1.1152, "step": 30877 }, { "epoch": 0.93, "learning_rate": 6.361019139371954e-08, "loss": 0.9877, "step": 30878 }, { "epoch": 0.93, "learning_rate": 6.35555296557877e-08, "loss": 1.1229, "step": 30879 }, { "epoch": 0.93, "learning_rate": 6.350089111163416e-08, "loss": 1.0869, "step": 30880 }, { "epoch": 0.93, "learning_rate": 6.34462757617782e-08, "loss": 1.1405, "step": 30881 }, { "epoch": 0.93, "learning_rate": 6.339168360674025e-08, "loss": 1.1789, "step": 30882 }, { "epoch": 0.93, "learning_rate": 6.33371146470399e-08, "loss": 1.0963, "step": 30883 }, { "epoch": 0.93, "learning_rate": 6.328256888319672e-08, "loss": 1.0596, "step": 30884 }, { "epoch": 0.93, "learning_rate": 6.322804631573005e-08, "loss": 1.0942, "step": 30885 }, { "epoch": 0.93, "learning_rate": 6.317354694515859e-08, "loss": 1.0983, "step": 30886 }, { "epoch": 0.93, "learning_rate": 6.31190707720014e-08, "loss": 1.2254, "step": 30887 }, { "epoch": 0.93, "learning_rate": 6.306461779677753e-08, "loss": 1.032, "step": 30888 }, { "epoch": 0.93, "learning_rate": 6.30101880200043e-08, "loss": 1.1088, "step": 30889 }, { "epoch": 0.93, "learning_rate": 6.29557814422005e-08, "loss": 1.0834, "step": 30890 }, { "epoch": 0.93, "learning_rate": 6.290139806388373e-08, "loss": 0.9915, "step": 30891 }, { "epoch": 0.93, "learning_rate": 6.284703788557223e-08, "loss": 1.1487, "step": 30892 }, { "epoch": 0.93, "learning_rate": 6.279270090778306e-08, "loss": 1.0583, "step": 30893 }, { "epoch": 0.93, "learning_rate": 6.273838713103358e-08, "loss": 1.0944, "step": 30894 }, { "epoch": 0.93, "learning_rate": 6.268409655584062e-08, "loss": 1.0723, "step": 30895 }, { "epoch": 0.93, "learning_rate": 6.262982918272182e-08, "loss": 1.1932, "step": 30896 }, { "epoch": 0.93, "learning_rate": 6.257558501219257e-08, "loss": 1.2135, "step": 30897 }, { "epoch": 0.93, "learning_rate": 6.252136404477e-08, "loss": 1.0673, "step": 30898 }, { "epoch": 0.93, "learning_rate": 6.246716628097005e-08, "loss": 1.0764, "step": 30899 }, { "epoch": 0.93, "learning_rate": 6.241299172130872e-08, "loss": 1.1578, "step": 30900 }, { "epoch": 0.93, "learning_rate": 6.235884036630196e-08, "loss": 1.043, "step": 30901 }, { "epoch": 0.93, "learning_rate": 6.230471221646495e-08, "loss": 1.0322, "step": 30902 }, { "epoch": 0.93, "learning_rate": 6.22506072723128e-08, "loss": 0.9703, "step": 30903 }, { "epoch": 0.93, "learning_rate": 6.219652553436095e-08, "loss": 1.1196, "step": 30904 }, { "epoch": 0.93, "learning_rate": 6.214246700312427e-08, "loss": 1.1626, "step": 30905 }, { "epoch": 0.93, "learning_rate": 6.208843167911705e-08, "loss": 1.179, "step": 30906 }, { "epoch": 0.93, "learning_rate": 6.203441956285389e-08, "loss": 1.0377, "step": 30907 }, { "epoch": 0.93, "learning_rate": 6.198043065484882e-08, "loss": 1.1041, "step": 30908 }, { "epoch": 0.93, "learning_rate": 6.192646495561561e-08, "loss": 1.0102, "step": 30909 }, { "epoch": 0.93, "learning_rate": 6.187252246566855e-08, "loss": 1.1104, "step": 30910 }, { "epoch": 0.93, "learning_rate": 6.181860318552058e-08, "loss": 1.1157, "step": 30911 }, { "epoch": 0.93, "learning_rate": 6.176470711568544e-08, "loss": 1.1906, "step": 30912 }, { "epoch": 0.93, "learning_rate": 6.171083425667607e-08, "loss": 1.1226, "step": 30913 }, { "epoch": 0.93, "learning_rate": 6.165698460900538e-08, "loss": 1.0537, "step": 30914 }, { "epoch": 0.93, "learning_rate": 6.160315817318546e-08, "loss": 1.0817, "step": 30915 }, { "epoch": 0.93, "learning_rate": 6.154935494972925e-08, "loss": 1.1949, "step": 30916 }, { "epoch": 0.93, "learning_rate": 6.149557493914881e-08, "loss": 1.1405, "step": 30917 }, { "epoch": 0.93, "learning_rate": 6.144181814195627e-08, "loss": 1.0219, "step": 30918 }, { "epoch": 0.93, "learning_rate": 6.138808455866285e-08, "loss": 1.0428, "step": 30919 }, { "epoch": 0.93, "learning_rate": 6.133437418978038e-08, "loss": 1.1264, "step": 30920 }, { "epoch": 0.93, "learning_rate": 6.128068703582013e-08, "loss": 1.1533, "step": 30921 }, { "epoch": 0.93, "learning_rate": 6.122702309729362e-08, "loss": 1.038, "step": 30922 }, { "epoch": 0.93, "learning_rate": 6.117338237471099e-08, "loss": 1.1329, "step": 30923 }, { "epoch": 0.93, "learning_rate": 6.111976486858324e-08, "loss": 1.1113, "step": 30924 }, { "epoch": 0.93, "learning_rate": 6.106617057942077e-08, "loss": 1.0195, "step": 30925 }, { "epoch": 0.93, "learning_rate": 6.101259950773347e-08, "loss": 1.0983, "step": 30926 }, { "epoch": 0.93, "learning_rate": 6.095905165403204e-08, "loss": 0.9696, "step": 30927 }, { "epoch": 0.93, "learning_rate": 6.090552701882551e-08, "loss": 1.0118, "step": 30928 }, { "epoch": 0.93, "learning_rate": 6.085202560262349e-08, "loss": 1.1288, "step": 30929 }, { "epoch": 0.93, "learning_rate": 6.079854740593555e-08, "loss": 1.0632, "step": 30930 }, { "epoch": 0.93, "learning_rate": 6.074509242927101e-08, "loss": 1.0461, "step": 30931 }, { "epoch": 0.93, "learning_rate": 6.069166067313808e-08, "loss": 1.1617, "step": 30932 }, { "epoch": 0.93, "learning_rate": 6.063825213804553e-08, "loss": 1.0812, "step": 30933 }, { "epoch": 0.93, "learning_rate": 6.05848668245021e-08, "loss": 0.9465, "step": 30934 }, { "epoch": 0.93, "learning_rate": 6.0531504733016e-08, "loss": 0.9752, "step": 30935 }, { "epoch": 0.93, "learning_rate": 6.047816586409517e-08, "loss": 1.073, "step": 30936 }, { "epoch": 0.93, "learning_rate": 6.042485021824696e-08, "loss": 1.1833, "step": 30937 }, { "epoch": 0.93, "learning_rate": 6.037155779597959e-08, "loss": 1.0445, "step": 30938 }, { "epoch": 0.93, "learning_rate": 6.031828859779987e-08, "loss": 1.1072, "step": 30939 }, { "epoch": 0.93, "learning_rate": 6.026504262421517e-08, "loss": 1.0637, "step": 30940 }, { "epoch": 0.93, "learning_rate": 6.021181987573205e-08, "loss": 1.0046, "step": 30941 }, { "epoch": 0.93, "learning_rate": 6.015862035285758e-08, "loss": 1.0983, "step": 30942 }, { "epoch": 0.93, "learning_rate": 6.010544405609775e-08, "loss": 1.2784, "step": 30943 }, { "epoch": 0.93, "learning_rate": 6.005229098595938e-08, "loss": 1.0524, "step": 30944 }, { "epoch": 0.93, "learning_rate": 5.999916114294763e-08, "loss": 1.1776, "step": 30945 }, { "epoch": 0.93, "learning_rate": 5.994605452756902e-08, "loss": 1.0074, "step": 30946 }, { "epoch": 0.93, "learning_rate": 5.989297114032871e-08, "loss": 1.0896, "step": 30947 }, { "epoch": 0.93, "learning_rate": 5.983991098173214e-08, "loss": 1.1061, "step": 30948 }, { "epoch": 0.93, "learning_rate": 5.978687405228444e-08, "loss": 1.1756, "step": 30949 }, { "epoch": 0.93, "learning_rate": 5.973386035249024e-08, "loss": 1.164, "step": 30950 }, { "epoch": 0.93, "learning_rate": 5.968086988285465e-08, "loss": 1.0497, "step": 30951 }, { "epoch": 0.93, "learning_rate": 5.962790264388174e-08, "loss": 1.0189, "step": 30952 }, { "epoch": 0.93, "learning_rate": 5.95749586360761e-08, "loss": 1.1367, "step": 30953 }, { "epoch": 0.93, "learning_rate": 5.9522037859941204e-08, "loss": 1.0998, "step": 30954 }, { "epoch": 0.93, "learning_rate": 5.946914031598111e-08, "loss": 1.2452, "step": 30955 }, { "epoch": 0.93, "learning_rate": 5.9416266004699577e-08, "loss": 1.118, "step": 30956 }, { "epoch": 0.93, "learning_rate": 5.936341492659981e-08, "loss": 1.0687, "step": 30957 }, { "epoch": 0.93, "learning_rate": 5.931058708218473e-08, "loss": 1.0703, "step": 30958 }, { "epoch": 0.93, "learning_rate": 5.925778247195757e-08, "loss": 1.1603, "step": 30959 }, { "epoch": 0.93, "learning_rate": 5.920500109642069e-08, "loss": 1.1653, "step": 30960 }, { "epoch": 0.93, "learning_rate": 5.9152242956076465e-08, "loss": 1.0251, "step": 30961 }, { "epoch": 0.93, "learning_rate": 5.909950805142783e-08, "loss": 0.9598, "step": 30962 }, { "epoch": 0.93, "learning_rate": 5.9046796382976054e-08, "loss": 1.0497, "step": 30963 }, { "epoch": 0.93, "learning_rate": 5.899410795122296e-08, "loss": 1.0797, "step": 30964 }, { "epoch": 0.93, "learning_rate": 5.8941442756670354e-08, "loss": 1.09, "step": 30965 }, { "epoch": 0.93, "learning_rate": 5.888880079981979e-08, "loss": 1.1602, "step": 30966 }, { "epoch": 0.93, "learning_rate": 5.883618208117198e-08, "loss": 1.111, "step": 30967 }, { "epoch": 0.93, "learning_rate": 5.878358660122818e-08, "loss": 1.0403, "step": 30968 }, { "epoch": 0.93, "learning_rate": 5.8731014360488834e-08, "loss": 1.1771, "step": 30969 }, { "epoch": 0.93, "learning_rate": 5.867846535945465e-08, "loss": 1.1031, "step": 30970 }, { "epoch": 0.93, "learning_rate": 5.86259395986255e-08, "loss": 1.0783, "step": 30971 }, { "epoch": 0.93, "learning_rate": 5.857343707850155e-08, "loss": 1.1238, "step": 30972 }, { "epoch": 0.93, "learning_rate": 5.8520957799582666e-08, "loss": 1.1032, "step": 30973 }, { "epoch": 0.93, "learning_rate": 5.846850176236874e-08, "loss": 1.0682, "step": 30974 }, { "epoch": 0.93, "learning_rate": 5.841606896735852e-08, "loss": 1.1255, "step": 30975 }, { "epoch": 0.93, "learning_rate": 5.8363659415051345e-08, "loss": 1.0807, "step": 30976 }, { "epoch": 0.93, "learning_rate": 5.8311273105946255e-08, "loss": 1.0077, "step": 30977 }, { "epoch": 0.93, "learning_rate": 5.825891004054174e-08, "loss": 1.0784, "step": 30978 }, { "epoch": 0.93, "learning_rate": 5.820657021933685e-08, "loss": 1.0859, "step": 30979 }, { "epoch": 0.93, "learning_rate": 5.815425364282895e-08, "loss": 1.1349, "step": 30980 }, { "epoch": 0.93, "learning_rate": 5.810196031151683e-08, "loss": 0.9949, "step": 30981 }, { "epoch": 0.93, "learning_rate": 5.8049690225897845e-08, "loss": 1.0942, "step": 30982 }, { "epoch": 0.93, "learning_rate": 5.799744338646995e-08, "loss": 1.0535, "step": 30983 }, { "epoch": 0.93, "learning_rate": 5.7945219793729965e-08, "loss": 1.0581, "step": 30984 }, { "epoch": 0.93, "learning_rate": 5.7893019448175545e-08, "loss": 1.1306, "step": 30985 }, { "epoch": 0.93, "learning_rate": 5.784084235030324e-08, "loss": 1.0345, "step": 30986 }, { "epoch": 0.93, "learning_rate": 5.7788688500610145e-08, "loss": 1.1368, "step": 30987 }, { "epoch": 0.93, "learning_rate": 5.7736557899592537e-08, "loss": 1.0134, "step": 30988 }, { "epoch": 0.93, "learning_rate": 5.768445054774641e-08, "loss": 1.0534, "step": 30989 }, { "epoch": 0.93, "learning_rate": 5.7632366445568024e-08, "loss": 1.1521, "step": 30990 }, { "epoch": 0.93, "learning_rate": 5.758030559355338e-08, "loss": 1.1238, "step": 30991 }, { "epoch": 0.93, "learning_rate": 5.7528267992197904e-08, "loss": 1.1274, "step": 30992 }, { "epoch": 0.93, "learning_rate": 5.747625364199705e-08, "loss": 1.0156, "step": 30993 }, { "epoch": 0.93, "learning_rate": 5.742426254344569e-08, "loss": 1.0529, "step": 30994 }, { "epoch": 0.93, "learning_rate": 5.7372294697039255e-08, "loss": 1.0521, "step": 30995 }, { "epoch": 0.93, "learning_rate": 5.732035010327208e-08, "loss": 1.0987, "step": 30996 }, { "epoch": 0.93, "learning_rate": 5.726842876263877e-08, "loss": 1.1135, "step": 30997 }, { "epoch": 0.93, "learning_rate": 5.721653067563337e-08, "loss": 1.138, "step": 30998 }, { "epoch": 0.93, "learning_rate": 5.716465584275022e-08, "loss": 1.1522, "step": 30999 }, { "epoch": 0.93, "learning_rate": 5.7112804264483345e-08, "loss": 1.081, "step": 31000 }, { "epoch": 0.93, "learning_rate": 5.70609759413257e-08, "loss": 1.0541, "step": 31001 }, { "epoch": 0.93, "learning_rate": 5.700917087377106e-08, "loss": 1.1306, "step": 31002 }, { "epoch": 0.93, "learning_rate": 5.695738906231235e-08, "loss": 1.1525, "step": 31003 }, { "epoch": 0.93, "learning_rate": 5.69056305074428e-08, "loss": 1.1094, "step": 31004 }, { "epoch": 0.93, "learning_rate": 5.685389520965534e-08, "loss": 1.1109, "step": 31005 }, { "epoch": 0.93, "learning_rate": 5.6802183169441804e-08, "loss": 1.0854, "step": 31006 }, { "epoch": 0.93, "learning_rate": 5.675049438729485e-08, "loss": 1.0549, "step": 31007 }, { "epoch": 0.93, "learning_rate": 5.669882886370631e-08, "loss": 1.1214, "step": 31008 }, { "epoch": 0.93, "learning_rate": 5.664718659916857e-08, "loss": 1.0465, "step": 31009 }, { "epoch": 0.93, "learning_rate": 5.659556759417262e-08, "loss": 1.0067, "step": 31010 }, { "epoch": 0.93, "learning_rate": 5.654397184921001e-08, "loss": 1.0523, "step": 31011 }, { "epoch": 0.93, "learning_rate": 5.6492399364772024e-08, "loss": 1.0923, "step": 31012 }, { "epoch": 0.93, "learning_rate": 5.644085014134992e-08, "loss": 1.1244, "step": 31013 }, { "epoch": 0.93, "learning_rate": 5.638932417943388e-08, "loss": 1.0625, "step": 31014 }, { "epoch": 0.93, "learning_rate": 5.6337821479514335e-08, "loss": 1.0118, "step": 31015 }, { "epoch": 0.93, "learning_rate": 5.6286342042082e-08, "loss": 1.2158, "step": 31016 }, { "epoch": 0.93, "learning_rate": 5.623488586762649e-08, "loss": 1.1586, "step": 31017 }, { "epoch": 0.93, "learning_rate": 5.618345295663824e-08, "loss": 1.0418, "step": 31018 }, { "epoch": 0.93, "learning_rate": 5.613204330960631e-08, "loss": 1.005, "step": 31019 }, { "epoch": 0.93, "learning_rate": 5.608065692702031e-08, "loss": 1.1562, "step": 31020 }, { "epoch": 0.93, "learning_rate": 5.602929380936956e-08, "loss": 1.0735, "step": 31021 }, { "epoch": 0.93, "learning_rate": 5.5977953957143116e-08, "loss": 1.1331, "step": 31022 }, { "epoch": 0.93, "learning_rate": 5.5926637370829206e-08, "loss": 1.0203, "step": 31023 }, { "epoch": 0.93, "learning_rate": 5.58753440509166e-08, "loss": 1.1042, "step": 31024 }, { "epoch": 0.93, "learning_rate": 5.582407399789352e-08, "loss": 1.0464, "step": 31025 }, { "epoch": 0.93, "learning_rate": 5.577282721224847e-08, "loss": 1.1485, "step": 31026 }, { "epoch": 0.93, "learning_rate": 5.572160369446855e-08, "loss": 1.0877, "step": 31027 }, { "epoch": 0.93, "learning_rate": 5.567040344504171e-08, "loss": 1.0238, "step": 31028 }, { "epoch": 0.93, "learning_rate": 5.561922646445561e-08, "loss": 1.0778, "step": 31029 }, { "epoch": 0.93, "learning_rate": 5.556807275319709e-08, "loss": 1.0834, "step": 31030 }, { "epoch": 0.93, "learning_rate": 5.551694231175353e-08, "loss": 1.1578, "step": 31031 }, { "epoch": 0.93, "learning_rate": 5.5465835140610936e-08, "loss": 1.1484, "step": 31032 }, { "epoch": 0.93, "learning_rate": 5.5414751240256416e-08, "loss": 1.0652, "step": 31033 }, { "epoch": 0.93, "learning_rate": 5.5363690611176245e-08, "loss": 1.0815, "step": 31034 }, { "epoch": 0.93, "learning_rate": 5.531265325385643e-08, "loss": 1.2014, "step": 31035 }, { "epoch": 0.93, "learning_rate": 5.5261639168782686e-08, "loss": 1.0997, "step": 31036 }, { "epoch": 0.93, "learning_rate": 5.521064835644047e-08, "loss": 1.1891, "step": 31037 }, { "epoch": 0.94, "learning_rate": 5.515968081731549e-08, "loss": 1.1257, "step": 31038 }, { "epoch": 0.94, "learning_rate": 5.5108736551893193e-08, "loss": 1.1855, "step": 31039 }, { "epoch": 0.94, "learning_rate": 5.50578155606582e-08, "loss": 1.0293, "step": 31040 }, { "epoch": 0.94, "learning_rate": 5.500691784409484e-08, "loss": 1.0103, "step": 31041 }, { "epoch": 0.94, "learning_rate": 5.495604340268829e-08, "loss": 1.0809, "step": 31042 }, { "epoch": 0.94, "learning_rate": 5.490519223692259e-08, "loss": 0.9029, "step": 31043 }, { "epoch": 0.94, "learning_rate": 5.4854364347282085e-08, "loss": 1.1344, "step": 31044 }, { "epoch": 0.94, "learning_rate": 5.480355973425028e-08, "loss": 0.9663, "step": 31045 }, { "epoch": 0.94, "learning_rate": 5.4752778398310946e-08, "loss": 1.2206, "step": 31046 }, { "epoch": 0.94, "learning_rate": 5.470202033994731e-08, "loss": 1.0612, "step": 31047 }, { "epoch": 0.94, "learning_rate": 5.4651285559642886e-08, "loss": 0.8832, "step": 31048 }, { "epoch": 0.94, "learning_rate": 5.4600574057880604e-08, "loss": 1.1361, "step": 31049 }, { "epoch": 0.94, "learning_rate": 5.454988583514287e-08, "loss": 1.1545, "step": 31050 }, { "epoch": 0.94, "learning_rate": 5.449922089191262e-08, "loss": 1.0818, "step": 31051 }, { "epoch": 0.94, "learning_rate": 5.444857922867225e-08, "loss": 1.0177, "step": 31052 }, { "epoch": 0.94, "learning_rate": 5.439796084590332e-08, "loss": 1.0134, "step": 31053 }, { "epoch": 0.94, "learning_rate": 5.434736574408794e-08, "loss": 1.0406, "step": 31054 }, { "epoch": 0.94, "learning_rate": 5.429679392370768e-08, "loss": 1.0549, "step": 31055 }, { "epoch": 0.94, "learning_rate": 5.424624538524409e-08, "loss": 1.1595, "step": 31056 }, { "epoch": 0.94, "learning_rate": 5.4195720129178455e-08, "loss": 1.1266, "step": 31057 }, { "epoch": 0.94, "learning_rate": 5.4145218155991774e-08, "loss": 1.1585, "step": 31058 }, { "epoch": 0.94, "learning_rate": 5.409473946616423e-08, "loss": 1.1031, "step": 31059 }, { "epoch": 0.94, "learning_rate": 5.404428406017709e-08, "loss": 1.0515, "step": 31060 }, { "epoch": 0.94, "learning_rate": 5.399385193851026e-08, "loss": 1.2819, "step": 31061 }, { "epoch": 0.94, "learning_rate": 5.39434431016439e-08, "loss": 1.072, "step": 31062 }, { "epoch": 0.94, "learning_rate": 5.3893057550057915e-08, "loss": 1.0392, "step": 31063 }, { "epoch": 0.94, "learning_rate": 5.384269528423192e-08, "loss": 1.2041, "step": 31064 }, { "epoch": 0.94, "learning_rate": 5.379235630464552e-08, "loss": 1.1093, "step": 31065 }, { "epoch": 0.94, "learning_rate": 5.374204061177751e-08, "loss": 0.9891, "step": 31066 }, { "epoch": 0.94, "learning_rate": 5.369174820610723e-08, "loss": 1.1615, "step": 31067 }, { "epoch": 0.94, "learning_rate": 5.364147908811346e-08, "loss": 1.0382, "step": 31068 }, { "epoch": 0.94, "learning_rate": 5.359123325827442e-08, "loss": 1.0294, "step": 31069 }, { "epoch": 0.94, "learning_rate": 5.354101071706863e-08, "loss": 1.1403, "step": 31070 }, { "epoch": 0.94, "learning_rate": 5.349081146497431e-08, "loss": 1.0068, "step": 31071 }, { "epoch": 0.94, "learning_rate": 5.3440635502468866e-08, "loss": 1.1085, "step": 31072 }, { "epoch": 0.94, "learning_rate": 5.339048283003051e-08, "loss": 1.1243, "step": 31073 }, { "epoch": 0.94, "learning_rate": 5.334035344813637e-08, "loss": 1.0619, "step": 31074 }, { "epoch": 0.94, "learning_rate": 5.329024735726357e-08, "loss": 1.2241, "step": 31075 }, { "epoch": 0.94, "learning_rate": 5.3240164557889494e-08, "loss": 1.0836, "step": 31076 }, { "epoch": 0.94, "learning_rate": 5.3190105050490435e-08, "loss": 1.0591, "step": 31077 }, { "epoch": 0.94, "learning_rate": 5.3140068835543514e-08, "loss": 1.0876, "step": 31078 }, { "epoch": 0.94, "learning_rate": 5.3090055913524175e-08, "loss": 1.1411, "step": 31079 }, { "epoch": 0.94, "learning_rate": 5.3040066284909264e-08, "loss": 1.2538, "step": 31080 }, { "epoch": 0.94, "learning_rate": 5.299009995017451e-08, "loss": 1.2189, "step": 31081 }, { "epoch": 0.94, "learning_rate": 5.2940156909795646e-08, "loss": 1.0954, "step": 31082 }, { "epoch": 0.94, "learning_rate": 5.289023716424757e-08, "loss": 1.1189, "step": 31083 }, { "epoch": 0.94, "learning_rate": 5.284034071400601e-08, "loss": 1.0424, "step": 31084 }, { "epoch": 0.94, "learning_rate": 5.279046755954587e-08, "loss": 1.19, "step": 31085 }, { "epoch": 0.94, "learning_rate": 5.2740617701341754e-08, "loss": 1.0423, "step": 31086 }, { "epoch": 0.94, "learning_rate": 5.269079113986858e-08, "loss": 1.1532, "step": 31087 }, { "epoch": 0.94, "learning_rate": 5.2640987875600127e-08, "loss": 1.0822, "step": 31088 }, { "epoch": 0.94, "learning_rate": 5.259120790901101e-08, "loss": 0.9902, "step": 31089 }, { "epoch": 0.94, "learning_rate": 5.254145124057447e-08, "loss": 1.0452, "step": 31090 }, { "epoch": 0.94, "learning_rate": 5.2491717870765127e-08, "loss": 1.1678, "step": 31091 }, { "epoch": 0.94, "learning_rate": 5.244200780005565e-08, "loss": 1.1803, "step": 31092 }, { "epoch": 0.94, "learning_rate": 5.2392321028919276e-08, "loss": 1.2394, "step": 31093 }, { "epoch": 0.94, "learning_rate": 5.2342657557829245e-08, "loss": 1.3077, "step": 31094 }, { "epoch": 0.94, "learning_rate": 5.2293017387258506e-08, "loss": 1.0294, "step": 31095 }, { "epoch": 0.94, "learning_rate": 5.2243400517679176e-08, "loss": 1.0469, "step": 31096 }, { "epoch": 0.94, "learning_rate": 5.219380694956394e-08, "loss": 1.1168, "step": 31097 }, { "epoch": 0.94, "learning_rate": 5.214423668338464e-08, "loss": 1.1254, "step": 31098 }, { "epoch": 0.94, "learning_rate": 5.20946897196134e-08, "loss": 1.1139, "step": 31099 }, { "epoch": 0.94, "learning_rate": 5.2045166058721506e-08, "loss": 1.1007, "step": 31100 }, { "epoch": 0.94, "learning_rate": 5.199566570118081e-08, "loss": 1.1196, "step": 31101 }, { "epoch": 0.94, "learning_rate": 5.194618864746231e-08, "loss": 1.0652, "step": 31102 }, { "epoch": 0.94, "learning_rate": 5.1896734898037313e-08, "loss": 1.0381, "step": 31103 }, { "epoch": 0.94, "learning_rate": 5.184730445337627e-08, "loss": 1.0577, "step": 31104 }, { "epoch": 0.94, "learning_rate": 5.179789731394963e-08, "loss": 1.0853, "step": 31105 }, { "epoch": 0.94, "learning_rate": 5.174851348022814e-08, "loss": 1.1501, "step": 31106 }, { "epoch": 0.94, "learning_rate": 5.169915295268141e-08, "loss": 1.0825, "step": 31107 }, { "epoch": 0.94, "learning_rate": 5.1649815731780185e-08, "loss": 1.0579, "step": 31108 }, { "epoch": 0.94, "learning_rate": 5.1600501817992975e-08, "loss": 1.1053, "step": 31109 }, { "epoch": 0.94, "learning_rate": 5.155121121178996e-08, "loss": 1.1082, "step": 31110 }, { "epoch": 0.94, "learning_rate": 5.1501943913640215e-08, "loss": 1.215, "step": 31111 }, { "epoch": 0.94, "learning_rate": 5.145269992401253e-08, "loss": 1.1609, "step": 31112 }, { "epoch": 0.94, "learning_rate": 5.140347924337624e-08, "loss": 1.0209, "step": 31113 }, { "epoch": 0.94, "learning_rate": 5.135428187219932e-08, "loss": 1.1258, "step": 31114 }, { "epoch": 0.94, "learning_rate": 5.130510781095027e-08, "loss": 1.0991, "step": 31115 }, { "epoch": 0.94, "learning_rate": 5.125595706009734e-08, "loss": 1.1084, "step": 31116 }, { "epoch": 0.94, "learning_rate": 5.1206829620108756e-08, "loss": 1.0601, "step": 31117 }, { "epoch": 0.94, "learning_rate": 5.115772549145109e-08, "loss": 1.207, "step": 31118 }, { "epoch": 0.94, "learning_rate": 5.1108644674592865e-08, "loss": 1.1276, "step": 31119 }, { "epoch": 0.94, "learning_rate": 5.1059587170000643e-08, "loss": 1.0524, "step": 31120 }, { "epoch": 0.94, "learning_rate": 5.1010552978142115e-08, "loss": 1.022, "step": 31121 }, { "epoch": 0.94, "learning_rate": 5.0961542099483566e-08, "loss": 1.1374, "step": 31122 }, { "epoch": 0.94, "learning_rate": 5.091255453449129e-08, "loss": 1.0974, "step": 31123 }, { "epoch": 0.94, "learning_rate": 5.086359028363214e-08, "loss": 1.0881, "step": 31124 }, { "epoch": 0.94, "learning_rate": 5.081464934737212e-08, "loss": 1.0531, "step": 31125 }, { "epoch": 0.94, "learning_rate": 5.076573172617699e-08, "loss": 0.9929, "step": 31126 }, { "epoch": 0.94, "learning_rate": 5.071683742051276e-08, "loss": 1.0683, "step": 31127 }, { "epoch": 0.94, "learning_rate": 5.066796643084432e-08, "loss": 1.0262, "step": 31128 }, { "epoch": 0.94, "learning_rate": 5.061911875763742e-08, "loss": 1.0282, "step": 31129 }, { "epoch": 0.94, "learning_rate": 5.057029440135669e-08, "loss": 1.2625, "step": 31130 }, { "epoch": 0.94, "learning_rate": 5.052149336246703e-08, "loss": 1.3263, "step": 31131 }, { "epoch": 0.94, "learning_rate": 5.047271564143308e-08, "loss": 1.1345, "step": 31132 }, { "epoch": 0.94, "learning_rate": 5.0423961238719176e-08, "loss": 1.0199, "step": 31133 }, { "epoch": 0.94, "learning_rate": 5.03752301547894e-08, "loss": 1.0353, "step": 31134 }, { "epoch": 0.94, "learning_rate": 5.0326522390107824e-08, "loss": 1.0329, "step": 31135 }, { "epoch": 0.94, "learning_rate": 5.0277837945137686e-08, "loss": 1.1529, "step": 31136 }, { "epoch": 0.94, "learning_rate": 5.022917682034278e-08, "loss": 1.1545, "step": 31137 }, { "epoch": 0.94, "learning_rate": 5.018053901618608e-08, "loss": 1.0399, "step": 31138 }, { "epoch": 0.94, "learning_rate": 5.013192453313137e-08, "loss": 1.1963, "step": 31139 }, { "epoch": 0.94, "learning_rate": 5.008333337164023e-08, "loss": 1.1018, "step": 31140 }, { "epoch": 0.94, "learning_rate": 5.0034765532176175e-08, "loss": 1.1278, "step": 31141 }, { "epoch": 0.94, "learning_rate": 4.998622101520106e-08, "loss": 1.1154, "step": 31142 }, { "epoch": 0.94, "learning_rate": 4.99376998211773e-08, "loss": 1.0778, "step": 31143 }, { "epoch": 0.94, "learning_rate": 4.988920195056646e-08, "loss": 1.1832, "step": 31144 }, { "epoch": 0.94, "learning_rate": 4.984072740383067e-08, "loss": 1.0897, "step": 31145 }, { "epoch": 0.94, "learning_rate": 4.9792276181430674e-08, "loss": 1.0574, "step": 31146 }, { "epoch": 0.94, "learning_rate": 4.9743848283828614e-08, "loss": 1.0637, "step": 31147 }, { "epoch": 0.94, "learning_rate": 4.969544371148494e-08, "loss": 1.0944, "step": 31148 }, { "epoch": 0.94, "learning_rate": 4.96470624648604e-08, "loss": 1.1286, "step": 31149 }, { "epoch": 0.94, "learning_rate": 4.9598704544415734e-08, "loss": 1.158, "step": 31150 }, { "epoch": 0.94, "learning_rate": 4.955036995061113e-08, "loss": 1.0381, "step": 31151 }, { "epoch": 0.94, "learning_rate": 4.950205868390706e-08, "loss": 1.1075, "step": 31152 }, { "epoch": 0.94, "learning_rate": 4.945377074476288e-08, "loss": 1.1301, "step": 31153 }, { "epoch": 0.94, "learning_rate": 4.940550613363876e-08, "loss": 1.1122, "step": 31154 }, { "epoch": 0.94, "learning_rate": 4.935726485099407e-08, "loss": 1.0625, "step": 31155 }, { "epoch": 0.94, "learning_rate": 4.9309046897287885e-08, "loss": 1.0302, "step": 31156 }, { "epoch": 0.94, "learning_rate": 4.9260852272979e-08, "loss": 1.2113, "step": 31157 }, { "epoch": 0.94, "learning_rate": 4.9212680978526775e-08, "loss": 0.9841, "step": 31158 }, { "epoch": 0.94, "learning_rate": 4.9164533014389446e-08, "loss": 1.038, "step": 31159 }, { "epoch": 0.94, "learning_rate": 4.911640838102555e-08, "loss": 1.0846, "step": 31160 }, { "epoch": 0.94, "learning_rate": 4.906830707889276e-08, "loss": 1.1135, "step": 31161 }, { "epoch": 0.94, "learning_rate": 4.9020229108449614e-08, "loss": 1.2138, "step": 31162 }, { "epoch": 0.94, "learning_rate": 4.8972174470153233e-08, "loss": 1.069, "step": 31163 }, { "epoch": 0.94, "learning_rate": 4.892414316446103e-08, "loss": 1.0817, "step": 31164 }, { "epoch": 0.94, "learning_rate": 4.8876135191830986e-08, "loss": 1.1464, "step": 31165 }, { "epoch": 0.94, "learning_rate": 4.8828150552719664e-08, "loss": 1.0754, "step": 31166 }, { "epoch": 0.94, "learning_rate": 4.878018924758338e-08, "loss": 1.0453, "step": 31167 }, { "epoch": 0.94, "learning_rate": 4.8732251276879526e-08, "loss": 1.0893, "step": 31168 }, { "epoch": 0.94, "learning_rate": 4.8684336641063865e-08, "loss": 1.0421, "step": 31169 }, { "epoch": 0.94, "learning_rate": 4.863644534059297e-08, "loss": 1.0302, "step": 31170 }, { "epoch": 0.94, "learning_rate": 4.858857737592204e-08, "loss": 0.9835, "step": 31171 }, { "epoch": 0.94, "learning_rate": 4.8540732747507646e-08, "loss": 1.0737, "step": 31172 }, { "epoch": 0.94, "learning_rate": 4.8492911455804705e-08, "loss": 1.1385, "step": 31173 }, { "epoch": 0.94, "learning_rate": 4.84451135012684e-08, "loss": 1.1899, "step": 31174 }, { "epoch": 0.94, "learning_rate": 4.839733888435422e-08, "loss": 1.0612, "step": 31175 }, { "epoch": 0.94, "learning_rate": 4.834958760551622e-08, "loss": 1.0054, "step": 31176 }, { "epoch": 0.94, "learning_rate": 4.830185966520962e-08, "loss": 1.0959, "step": 31177 }, { "epoch": 0.94, "learning_rate": 4.8254155063888753e-08, "loss": 1.0029, "step": 31178 }, { "epoch": 0.94, "learning_rate": 4.820647380200716e-08, "loss": 1.0262, "step": 31179 }, { "epoch": 0.94, "learning_rate": 4.8158815880019195e-08, "loss": 1.1901, "step": 31180 }, { "epoch": 0.94, "learning_rate": 4.811118129837838e-08, "loss": 1.0861, "step": 31181 }, { "epoch": 0.94, "learning_rate": 4.806357005753853e-08, "loss": 1.1612, "step": 31182 }, { "epoch": 0.94, "learning_rate": 4.8015982157952334e-08, "loss": 1.0166, "step": 31183 }, { "epoch": 0.94, "learning_rate": 4.7968417600073034e-08, "loss": 1.0333, "step": 31184 }, { "epoch": 0.94, "learning_rate": 4.792087638435361e-08, "loss": 1.1288, "step": 31185 }, { "epoch": 0.94, "learning_rate": 4.787335851124675e-08, "loss": 1.0948, "step": 31186 }, { "epoch": 0.94, "learning_rate": 4.782586398120431e-08, "loss": 1.045, "step": 31187 }, { "epoch": 0.94, "learning_rate": 4.777839279467844e-08, "loss": 1.1372, "step": 31188 }, { "epoch": 0.94, "learning_rate": 4.773094495212127e-08, "loss": 1.084, "step": 31189 }, { "epoch": 0.94, "learning_rate": 4.7683520453984664e-08, "loss": 1.1261, "step": 31190 }, { "epoch": 0.94, "learning_rate": 4.763611930071993e-08, "loss": 1.1431, "step": 31191 }, { "epoch": 0.94, "learning_rate": 4.758874149277809e-08, "loss": 1.1619, "step": 31192 }, { "epoch": 0.94, "learning_rate": 4.754138703061017e-08, "loss": 1.0994, "step": 31193 }, { "epoch": 0.94, "learning_rate": 4.7494055914667214e-08, "loss": 1.1068, "step": 31194 }, { "epoch": 0.94, "learning_rate": 4.7446748145399956e-08, "loss": 1.0354, "step": 31195 }, { "epoch": 0.94, "learning_rate": 4.7399463723258046e-08, "loss": 0.9132, "step": 31196 }, { "epoch": 0.94, "learning_rate": 4.7352202648692226e-08, "loss": 1.0831, "step": 31197 }, { "epoch": 0.94, "learning_rate": 4.7304964922152144e-08, "loss": 1.0203, "step": 31198 }, { "epoch": 0.94, "learning_rate": 4.725775054408771e-08, "loss": 1.1816, "step": 31199 }, { "epoch": 0.94, "learning_rate": 4.7210559514948016e-08, "loss": 1.0368, "step": 31200 }, { "epoch": 0.94, "learning_rate": 4.7163391835182426e-08, "loss": 1.0764, "step": 31201 }, { "epoch": 0.94, "learning_rate": 4.7116247505240296e-08, "loss": 1.0812, "step": 31202 }, { "epoch": 0.94, "learning_rate": 4.7069126525569885e-08, "loss": 1.002, "step": 31203 }, { "epoch": 0.94, "learning_rate": 4.702202889662027e-08, "loss": 1.0255, "step": 31204 }, { "epoch": 0.94, "learning_rate": 4.697495461883944e-08, "loss": 1.1114, "step": 31205 }, { "epoch": 0.94, "learning_rate": 4.692790369267536e-08, "loss": 1.2127, "step": 31206 }, { "epoch": 0.94, "learning_rate": 4.688087611857628e-08, "loss": 1.1181, "step": 31207 }, { "epoch": 0.94, "learning_rate": 4.68338718969899e-08, "loss": 1.1325, "step": 31208 }, { "epoch": 0.94, "learning_rate": 4.6786891028363926e-08, "loss": 1.0658, "step": 31209 }, { "epoch": 0.94, "learning_rate": 4.673993351314493e-08, "loss": 1.0656, "step": 31210 }, { "epoch": 0.94, "learning_rate": 4.6692999351780065e-08, "loss": 1.1459, "step": 31211 }, { "epoch": 0.94, "learning_rate": 4.6646088544716474e-08, "loss": 1.1519, "step": 31212 }, { "epoch": 0.94, "learning_rate": 4.659920109240046e-08, "loss": 1.1703, "step": 31213 }, { "epoch": 0.94, "learning_rate": 4.655233699527834e-08, "loss": 1.1191, "step": 31214 }, { "epoch": 0.94, "learning_rate": 4.650549625379669e-08, "loss": 1.0963, "step": 31215 }, { "epoch": 0.94, "learning_rate": 4.645867886840072e-08, "loss": 1.1439, "step": 31216 }, { "epoch": 0.94, "learning_rate": 4.6411884839536734e-08, "loss": 1.2213, "step": 31217 }, { "epoch": 0.94, "learning_rate": 4.636511416764994e-08, "loss": 1.1409, "step": 31218 }, { "epoch": 0.94, "learning_rate": 4.631836685318525e-08, "loss": 1.0439, "step": 31219 }, { "epoch": 0.94, "learning_rate": 4.6271642896588144e-08, "loss": 1.0675, "step": 31220 }, { "epoch": 0.94, "learning_rate": 4.6224942298303544e-08, "loss": 1.068, "step": 31221 }, { "epoch": 0.94, "learning_rate": 4.6178265058775266e-08, "loss": 1.1178, "step": 31222 }, { "epoch": 0.94, "learning_rate": 4.613161117844822e-08, "loss": 1.0153, "step": 31223 }, { "epoch": 0.94, "learning_rate": 4.608498065776651e-08, "loss": 1.1355, "step": 31224 }, { "epoch": 0.94, "learning_rate": 4.603837349717394e-08, "loss": 1.2032, "step": 31225 }, { "epoch": 0.94, "learning_rate": 4.599178969711404e-08, "loss": 1.0381, "step": 31226 }, { "epoch": 0.94, "learning_rate": 4.594522925803063e-08, "loss": 1.0154, "step": 31227 }, { "epoch": 0.94, "learning_rate": 4.589869218036641e-08, "loss": 1.087, "step": 31228 }, { "epoch": 0.94, "learning_rate": 4.585217846456491e-08, "loss": 1.0026, "step": 31229 }, { "epoch": 0.94, "learning_rate": 4.5805688111068836e-08, "loss": 1.0728, "step": 31230 }, { "epoch": 0.94, "learning_rate": 4.575922112032061e-08, "loss": 1.1408, "step": 31231 }, { "epoch": 0.94, "learning_rate": 4.5712777492762375e-08, "loss": 1.103, "step": 31232 }, { "epoch": 0.94, "learning_rate": 4.5666357228836557e-08, "loss": 1.085, "step": 31233 }, { "epoch": 0.94, "learning_rate": 4.5619960328985024e-08, "loss": 1.0457, "step": 31234 }, { "epoch": 0.94, "learning_rate": 4.557358679364937e-08, "loss": 1.0696, "step": 31235 }, { "epoch": 0.94, "learning_rate": 4.5527236623271185e-08, "loss": 1.1129, "step": 31236 }, { "epoch": 0.94, "learning_rate": 4.548090981829123e-08, "loss": 1.2161, "step": 31237 }, { "epoch": 0.94, "learning_rate": 4.5434606379151094e-08, "loss": 1.1505, "step": 31238 }, { "epoch": 0.94, "learning_rate": 4.538832630629125e-08, "loss": 1.0149, "step": 31239 }, { "epoch": 0.94, "learning_rate": 4.534206960015247e-08, "loss": 1.1526, "step": 31240 }, { "epoch": 0.94, "learning_rate": 4.529583626117495e-08, "loss": 1.0917, "step": 31241 }, { "epoch": 0.94, "learning_rate": 4.52496262897989e-08, "loss": 1.0804, "step": 31242 }, { "epoch": 0.94, "learning_rate": 4.5203439686464513e-08, "loss": 1.2003, "step": 31243 }, { "epoch": 0.94, "learning_rate": 4.515727645161061e-08, "loss": 1.0996, "step": 31244 }, { "epoch": 0.94, "learning_rate": 4.5111136585677116e-08, "loss": 1.153, "step": 31245 }, { "epoch": 0.94, "learning_rate": 4.5065020089103406e-08, "loss": 1.1908, "step": 31246 }, { "epoch": 0.94, "learning_rate": 4.501892696232857e-08, "loss": 1.0649, "step": 31247 }, { "epoch": 0.94, "learning_rate": 4.497285720579114e-08, "loss": 1.0878, "step": 31248 }, { "epoch": 0.94, "learning_rate": 4.492681081992939e-08, "loss": 1.1492, "step": 31249 }, { "epoch": 0.94, "learning_rate": 4.4880787805182404e-08, "loss": 1.1584, "step": 31250 }, { "epoch": 0.94, "learning_rate": 4.483478816198789e-08, "loss": 0.9988, "step": 31251 }, { "epoch": 0.94, "learning_rate": 4.478881189078354e-08, "loss": 1.0186, "step": 31252 }, { "epoch": 0.94, "learning_rate": 4.474285899200709e-08, "loss": 1.1026, "step": 31253 }, { "epoch": 0.94, "learning_rate": 4.469692946609622e-08, "loss": 1.1024, "step": 31254 }, { "epoch": 0.94, "learning_rate": 4.465102331348808e-08, "loss": 1.1566, "step": 31255 }, { "epoch": 0.94, "learning_rate": 4.460514053461984e-08, "loss": 1.1828, "step": 31256 }, { "epoch": 0.94, "learning_rate": 4.455928112992808e-08, "loss": 1.0233, "step": 31257 }, { "epoch": 0.94, "learning_rate": 4.451344509984912e-08, "loss": 1.1398, "step": 31258 }, { "epoch": 0.94, "learning_rate": 4.446763244481983e-08, "loss": 1.1013, "step": 31259 }, { "epoch": 0.94, "learning_rate": 4.442184316527598e-08, "loss": 1.1811, "step": 31260 }, { "epoch": 0.94, "learning_rate": 4.437607726165361e-08, "loss": 1.1731, "step": 31261 }, { "epoch": 0.94, "learning_rate": 4.4330334734388194e-08, "loss": 1.0253, "step": 31262 }, { "epoch": 0.94, "learning_rate": 4.428461558391523e-08, "loss": 1.135, "step": 31263 }, { "epoch": 0.94, "learning_rate": 4.423891981067019e-08, "loss": 1.0122, "step": 31264 }, { "epoch": 0.94, "learning_rate": 4.4193247415087735e-08, "loss": 1.1509, "step": 31265 }, { "epoch": 0.94, "learning_rate": 4.4147598397602795e-08, "loss": 1.0813, "step": 31266 }, { "epoch": 0.94, "learning_rate": 4.410197275865003e-08, "loss": 1.0704, "step": 31267 }, { "epoch": 0.94, "learning_rate": 4.4056370498663794e-08, "loss": 1.1455, "step": 31268 }, { "epoch": 0.94, "learning_rate": 4.401079161807792e-08, "loss": 1.3256, "step": 31269 }, { "epoch": 0.94, "learning_rate": 4.3965236117326503e-08, "loss": 1.0936, "step": 31270 }, { "epoch": 0.94, "learning_rate": 4.3919703996843086e-08, "loss": 1.032, "step": 31271 }, { "epoch": 0.94, "learning_rate": 4.387419525706122e-08, "loss": 1.0857, "step": 31272 }, { "epoch": 0.94, "learning_rate": 4.382870989841442e-08, "loss": 1.1919, "step": 31273 }, { "epoch": 0.94, "learning_rate": 4.3783247921335146e-08, "loss": 1.1711, "step": 31274 }, { "epoch": 0.94, "learning_rate": 4.373780932625638e-08, "loss": 1.0175, "step": 31275 }, { "epoch": 0.94, "learning_rate": 4.3692394113610536e-08, "loss": 0.9756, "step": 31276 }, { "epoch": 0.94, "learning_rate": 4.364700228383062e-08, "loss": 0.9615, "step": 31277 }, { "epoch": 0.94, "learning_rate": 4.360163383734767e-08, "loss": 1.1184, "step": 31278 }, { "epoch": 0.94, "learning_rate": 4.3556288774594394e-08, "loss": 1.0754, "step": 31279 }, { "epoch": 0.94, "learning_rate": 4.351096709600211e-08, "loss": 1.1011, "step": 31280 }, { "epoch": 0.94, "learning_rate": 4.3465668802002426e-08, "loss": 1.2285, "step": 31281 }, { "epoch": 0.94, "learning_rate": 4.342039389302638e-08, "loss": 1.067, "step": 31282 }, { "epoch": 0.94, "learning_rate": 4.3375142369505016e-08, "loss": 1.0364, "step": 31283 }, { "epoch": 0.94, "learning_rate": 4.3329914231869106e-08, "loss": 1.0482, "step": 31284 }, { "epoch": 0.94, "learning_rate": 4.328470948054914e-08, "loss": 1.2277, "step": 31285 }, { "epoch": 0.94, "learning_rate": 4.323952811597587e-08, "loss": 1.2116, "step": 31286 }, { "epoch": 0.94, "learning_rate": 4.3194370138578966e-08, "loss": 1.2589, "step": 31287 }, { "epoch": 0.94, "learning_rate": 4.314923554878836e-08, "loss": 1.0568, "step": 31288 }, { "epoch": 0.94, "learning_rate": 4.3104124347033706e-08, "loss": 1.0913, "step": 31289 }, { "epoch": 0.94, "learning_rate": 4.3059036533744656e-08, "loss": 1.0635, "step": 31290 }, { "epoch": 0.94, "learning_rate": 4.301397210935032e-08, "loss": 1.0334, "step": 31291 }, { "epoch": 0.94, "learning_rate": 4.2968931074279516e-08, "loss": 1.0829, "step": 31292 }, { "epoch": 0.94, "learning_rate": 4.292391342896107e-08, "loss": 1.1835, "step": 31293 }, { "epoch": 0.94, "learning_rate": 4.287891917382381e-08, "loss": 1.0854, "step": 31294 }, { "epoch": 0.94, "learning_rate": 4.283394830929544e-08, "loss": 1.1602, "step": 31295 }, { "epoch": 0.94, "learning_rate": 4.2789000835804785e-08, "loss": 0.9744, "step": 31296 }, { "epoch": 0.94, "learning_rate": 4.2744076753779285e-08, "loss": 0.984, "step": 31297 }, { "epoch": 0.94, "learning_rate": 4.269917606364693e-08, "loss": 1.1662, "step": 31298 }, { "epoch": 0.94, "learning_rate": 4.265429876583488e-08, "loss": 1.1151, "step": 31299 }, { "epoch": 0.94, "learning_rate": 4.260944486077029e-08, "loss": 0.9758, "step": 31300 }, { "epoch": 0.94, "learning_rate": 4.256461434888032e-08, "loss": 1.0085, "step": 31301 }, { "epoch": 0.94, "learning_rate": 4.251980723059185e-08, "loss": 1.098, "step": 31302 }, { "epoch": 0.94, "learning_rate": 4.24750235063312e-08, "loss": 1.0565, "step": 31303 }, { "epoch": 0.94, "learning_rate": 4.243026317652443e-08, "loss": 1.0532, "step": 31304 }, { "epoch": 0.94, "learning_rate": 4.238552624159814e-08, "loss": 1.1089, "step": 31305 }, { "epoch": 0.94, "learning_rate": 4.234081270197809e-08, "loss": 1.0342, "step": 31306 }, { "epoch": 0.94, "learning_rate": 4.229612255809007e-08, "loss": 1.1265, "step": 31307 }, { "epoch": 0.94, "learning_rate": 4.2251455810358997e-08, "loss": 1.129, "step": 31308 }, { "epoch": 0.94, "learning_rate": 4.22068124592101e-08, "loss": 1.0989, "step": 31309 }, { "epoch": 0.94, "learning_rate": 4.2162192505068864e-08, "loss": 0.9583, "step": 31310 }, { "epoch": 0.94, "learning_rate": 4.211759594835996e-08, "loss": 1.1216, "step": 31311 }, { "epoch": 0.94, "learning_rate": 4.207302278950775e-08, "loss": 1.1327, "step": 31312 }, { "epoch": 0.94, "learning_rate": 4.2028473028936643e-08, "loss": 1.1193, "step": 31313 }, { "epoch": 0.94, "learning_rate": 4.198394666707045e-08, "loss": 1.0151, "step": 31314 }, { "epoch": 0.94, "learning_rate": 4.193944370433328e-08, "loss": 0.9839, "step": 31315 }, { "epoch": 0.94, "learning_rate": 4.189496414114924e-08, "loss": 1.1621, "step": 31316 }, { "epoch": 0.94, "learning_rate": 4.185050797794077e-08, "loss": 1.176, "step": 31317 }, { "epoch": 0.94, "learning_rate": 4.180607521513169e-08, "loss": 1.1147, "step": 31318 }, { "epoch": 0.94, "learning_rate": 4.176166585314473e-08, "loss": 1.215, "step": 31319 }, { "epoch": 0.94, "learning_rate": 4.171727989240315e-08, "loss": 1.1414, "step": 31320 }, { "epoch": 0.94, "learning_rate": 4.167291733332884e-08, "loss": 1.1193, "step": 31321 }, { "epoch": 0.94, "learning_rate": 4.1628578176344245e-08, "loss": 1.1041, "step": 31322 }, { "epoch": 0.94, "learning_rate": 4.15842624218718e-08, "loss": 1.1902, "step": 31323 }, { "epoch": 0.94, "learning_rate": 4.153997007033311e-08, "loss": 1.1364, "step": 31324 }, { "epoch": 0.94, "learning_rate": 4.149570112215007e-08, "loss": 1.1775, "step": 31325 }, { "epoch": 0.94, "learning_rate": 4.145145557774372e-08, "loss": 1.0377, "step": 31326 }, { "epoch": 0.94, "learning_rate": 4.1407233437535385e-08, "loss": 1.1279, "step": 31327 }, { "epoch": 0.94, "learning_rate": 4.136303470194614e-08, "loss": 1.0129, "step": 31328 }, { "epoch": 0.94, "learning_rate": 4.1318859371397013e-08, "loss": 1.0568, "step": 31329 }, { "epoch": 0.94, "learning_rate": 4.127470744630796e-08, "loss": 1.0911, "step": 31330 }, { "epoch": 0.94, "learning_rate": 4.1230578927099476e-08, "loss": 1.1592, "step": 31331 }, { "epoch": 0.94, "learning_rate": 4.11864738141915e-08, "loss": 1.0704, "step": 31332 }, { "epoch": 0.94, "learning_rate": 4.114239210800453e-08, "loss": 1.0629, "step": 31333 }, { "epoch": 0.94, "learning_rate": 4.109833380895739e-08, "loss": 0.9832, "step": 31334 }, { "epoch": 0.94, "learning_rate": 4.105429891747004e-08, "loss": 1.1495, "step": 31335 }, { "epoch": 0.94, "learning_rate": 4.101028743396129e-08, "loss": 1.0892, "step": 31336 }, { "epoch": 0.94, "learning_rate": 4.096629935885055e-08, "loss": 1.0971, "step": 31337 }, { "epoch": 0.94, "learning_rate": 4.0922334692556354e-08, "loss": 1.1543, "step": 31338 }, { "epoch": 0.94, "learning_rate": 4.087839343549699e-08, "loss": 1.072, "step": 31339 }, { "epoch": 0.94, "learning_rate": 4.083447558809101e-08, "loss": 1.0246, "step": 31340 }, { "epoch": 0.94, "learning_rate": 4.079058115075668e-08, "loss": 1.013, "step": 31341 }, { "epoch": 0.94, "learning_rate": 4.074671012391146e-08, "loss": 1.1265, "step": 31342 }, { "epoch": 0.94, "learning_rate": 4.070286250797306e-08, "loss": 1.1382, "step": 31343 }, { "epoch": 0.94, "learning_rate": 4.065903830335921e-08, "loss": 1.2777, "step": 31344 }, { "epoch": 0.94, "learning_rate": 4.061523751048652e-08, "loss": 1.0224, "step": 31345 }, { "epoch": 0.94, "learning_rate": 4.057146012977242e-08, "loss": 1.0649, "step": 31346 }, { "epoch": 0.94, "learning_rate": 4.052770616163354e-08, "loss": 1.0198, "step": 31347 }, { "epoch": 0.94, "learning_rate": 4.048397560648648e-08, "loss": 1.1261, "step": 31348 }, { "epoch": 0.94, "learning_rate": 4.04402684647473e-08, "loss": 1.0787, "step": 31349 }, { "epoch": 0.94, "learning_rate": 4.0396584736832056e-08, "loss": 1.1408, "step": 31350 }, { "epoch": 0.94, "learning_rate": 4.035292442315708e-08, "loss": 1.1876, "step": 31351 }, { "epoch": 0.94, "learning_rate": 4.03092875241376e-08, "loss": 1.0984, "step": 31352 }, { "epoch": 0.94, "learning_rate": 4.026567404018883e-08, "loss": 1.0383, "step": 31353 }, { "epoch": 0.94, "learning_rate": 4.022208397172628e-08, "loss": 1.0381, "step": 31354 }, { "epoch": 0.94, "learning_rate": 4.0178517319165165e-08, "loss": 1.1395, "step": 31355 }, { "epoch": 0.94, "learning_rate": 4.013497408291961e-08, "loss": 1.108, "step": 31356 }, { "epoch": 0.94, "learning_rate": 4.0091454263404275e-08, "loss": 1.0692, "step": 31357 }, { "epoch": 0.94, "learning_rate": 4.004795786103355e-08, "loss": 1.0345, "step": 31358 }, { "epoch": 0.94, "learning_rate": 4.000448487622183e-08, "loss": 1.0493, "step": 31359 }, { "epoch": 0.94, "learning_rate": 3.996103530938239e-08, "loss": 1.0765, "step": 31360 }, { "epoch": 0.94, "learning_rate": 3.991760916092907e-08, "loss": 1.0995, "step": 31361 }, { "epoch": 0.94, "learning_rate": 3.987420643127543e-08, "loss": 1.0628, "step": 31362 }, { "epoch": 0.94, "learning_rate": 3.9830827120834195e-08, "loss": 1.0678, "step": 31363 }, { "epoch": 0.94, "learning_rate": 3.9787471230019194e-08, "loss": 1.0503, "step": 31364 }, { "epoch": 0.94, "learning_rate": 3.9744138759242045e-08, "loss": 1.0739, "step": 31365 }, { "epoch": 0.94, "learning_rate": 3.9700829708916034e-08, "loss": 1.1252, "step": 31366 }, { "epoch": 0.94, "learning_rate": 3.965754407945332e-08, "loss": 1.0014, "step": 31367 }, { "epoch": 0.94, "learning_rate": 3.961428187126581e-08, "loss": 1.1695, "step": 31368 }, { "epoch": 0.94, "learning_rate": 3.9571043084765116e-08, "loss": 0.967, "step": 31369 }, { "epoch": 0.95, "learning_rate": 3.95278277203634e-08, "loss": 1.0688, "step": 31370 }, { "epoch": 0.95, "learning_rate": 3.9484635778471446e-08, "loss": 1.0146, "step": 31371 }, { "epoch": 0.95, "learning_rate": 3.9441467259500874e-08, "loss": 0.985, "step": 31372 }, { "epoch": 0.95, "learning_rate": 3.939832216386247e-08, "loss": 1.0582, "step": 31373 }, { "epoch": 0.95, "learning_rate": 3.9355200491967286e-08, "loss": 1.2156, "step": 31374 }, { "epoch": 0.95, "learning_rate": 3.931210224422527e-08, "loss": 1.0378, "step": 31375 }, { "epoch": 0.95, "learning_rate": 3.9269027421046934e-08, "loss": 1.0662, "step": 31376 }, { "epoch": 0.95, "learning_rate": 3.9225976022842224e-08, "loss": 1.0935, "step": 31377 }, { "epoch": 0.95, "learning_rate": 3.91829480500211e-08, "loss": 1.0378, "step": 31378 }, { "epoch": 0.95, "learning_rate": 3.9139943502993215e-08, "loss": 1.0526, "step": 31379 }, { "epoch": 0.95, "learning_rate": 3.9096962382167704e-08, "loss": 1.1819, "step": 31380 }, { "epoch": 0.95, "learning_rate": 3.9054004687954225e-08, "loss": 1.2688, "step": 31381 }, { "epoch": 0.95, "learning_rate": 3.9011070420761076e-08, "loss": 1.1224, "step": 31382 }, { "epoch": 0.95, "learning_rate": 3.896815958099764e-08, "loss": 1.0797, "step": 31383 }, { "epoch": 0.95, "learning_rate": 3.892527216907166e-08, "loss": 1.0425, "step": 31384 }, { "epoch": 0.95, "learning_rate": 3.888240818539224e-08, "loss": 1.0726, "step": 31385 }, { "epoch": 0.95, "learning_rate": 3.883956763036656e-08, "loss": 1.0914, "step": 31386 }, { "epoch": 0.95, "learning_rate": 3.8796750504402905e-08, "loss": 1.1438, "step": 31387 }, { "epoch": 0.95, "learning_rate": 3.8753956807909e-08, "loss": 1.0389, "step": 31388 }, { "epoch": 0.95, "learning_rate": 3.8711186541292026e-08, "loss": 1.1103, "step": 31389 }, { "epoch": 0.95, "learning_rate": 3.866843970495915e-08, "loss": 1.1515, "step": 31390 }, { "epoch": 0.95, "learning_rate": 3.862571629931727e-08, "loss": 1.0241, "step": 31391 }, { "epoch": 0.95, "learning_rate": 3.858301632477329e-08, "loss": 1.1274, "step": 31392 }, { "epoch": 0.95, "learning_rate": 3.854033978173327e-08, "loss": 0.9639, "step": 31393 }, { "epoch": 0.95, "learning_rate": 3.849768667060411e-08, "loss": 1.0943, "step": 31394 }, { "epoch": 0.95, "learning_rate": 3.845505699179103e-08, "loss": 1.1212, "step": 31395 }, { "epoch": 0.95, "learning_rate": 3.841245074570038e-08, "loss": 1.1123, "step": 31396 }, { "epoch": 0.95, "learning_rate": 3.836986793273767e-08, "loss": 1.1666, "step": 31397 }, { "epoch": 0.95, "learning_rate": 3.8327308553308684e-08, "loss": 1.0861, "step": 31398 }, { "epoch": 0.95, "learning_rate": 3.8284772607817544e-08, "loss": 1.1476, "step": 31399 }, { "epoch": 0.95, "learning_rate": 3.8242260096670033e-08, "loss": 1.129, "step": 31400 }, { "epoch": 0.95, "learning_rate": 3.819977102027056e-08, "loss": 0.9902, "step": 31401 }, { "epoch": 0.95, "learning_rate": 3.815730537902351e-08, "loss": 1.1179, "step": 31402 }, { "epoch": 0.95, "learning_rate": 3.8114863173333573e-08, "loss": 1.0357, "step": 31403 }, { "epoch": 0.95, "learning_rate": 3.807244440360403e-08, "loss": 1.1244, "step": 31404 }, { "epoch": 0.95, "learning_rate": 3.803004907023927e-08, "loss": 1.1122, "step": 31405 }, { "epoch": 0.95, "learning_rate": 3.798767717364288e-08, "loss": 1.0626, "step": 31406 }, { "epoch": 0.95, "learning_rate": 3.7945328714218133e-08, "loss": 1.1339, "step": 31407 }, { "epoch": 0.95, "learning_rate": 3.7903003692367765e-08, "loss": 1.1344, "step": 31408 }, { "epoch": 0.95, "learning_rate": 3.7860702108495075e-08, "loss": 1.1, "step": 31409 }, { "epoch": 0.95, "learning_rate": 3.781842396300278e-08, "loss": 1.1625, "step": 31410 }, { "epoch": 0.95, "learning_rate": 3.777616925629335e-08, "loss": 1.1097, "step": 31411 }, { "epoch": 0.95, "learning_rate": 3.773393798876895e-08, "loss": 1.2021, "step": 31412 }, { "epoch": 0.95, "learning_rate": 3.76917301608315e-08, "loss": 1.0907, "step": 31413 }, { "epoch": 0.95, "learning_rate": 3.7649545772882876e-08, "loss": 1.1416, "step": 31414 }, { "epoch": 0.95, "learning_rate": 3.760738482532444e-08, "loss": 1.1002, "step": 31415 }, { "epoch": 0.95, "learning_rate": 3.756524731855837e-08, "loss": 1.0687, "step": 31416 }, { "epoch": 0.95, "learning_rate": 3.7523133252984625e-08, "loss": 1.1426, "step": 31417 }, { "epoch": 0.95, "learning_rate": 3.748104262900482e-08, "loss": 1.0715, "step": 31418 }, { "epoch": 0.95, "learning_rate": 3.743897544701974e-08, "loss": 1.0733, "step": 31419 }, { "epoch": 0.95, "learning_rate": 3.739693170742964e-08, "loss": 0.9744, "step": 31420 }, { "epoch": 0.95, "learning_rate": 3.7354911410634466e-08, "loss": 1.1348, "step": 31421 }, { "epoch": 0.95, "learning_rate": 3.731291455703445e-08, "loss": 1.1467, "step": 31422 }, { "epoch": 0.95, "learning_rate": 3.7270941147029284e-08, "loss": 1.1621, "step": 31423 }, { "epoch": 0.95, "learning_rate": 3.722899118101919e-08, "loss": 1.0722, "step": 31424 }, { "epoch": 0.95, "learning_rate": 3.718706465940247e-08, "loss": 1.1227, "step": 31425 }, { "epoch": 0.95, "learning_rate": 3.714516158257908e-08, "loss": 1.0883, "step": 31426 }, { "epoch": 0.95, "learning_rate": 3.710328195094731e-08, "loss": 1.0999, "step": 31427 }, { "epoch": 0.95, "learning_rate": 3.706142576490629e-08, "loss": 1.0803, "step": 31428 }, { "epoch": 0.95, "learning_rate": 3.7019593024854305e-08, "loss": 1.1499, "step": 31429 }, { "epoch": 0.95, "learning_rate": 3.697778373118965e-08, "loss": 1.1291, "step": 31430 }, { "epoch": 0.95, "learning_rate": 3.693599788431007e-08, "loss": 1.0064, "step": 31431 }, { "epoch": 0.95, "learning_rate": 3.689423548461385e-08, "loss": 1.0197, "step": 31432 }, { "epoch": 0.95, "learning_rate": 3.685249653249817e-08, "loss": 1.0422, "step": 31433 }, { "epoch": 0.95, "learning_rate": 3.681078102836022e-08, "loss": 1.1389, "step": 31434 }, { "epoch": 0.95, "learning_rate": 3.6769088972597454e-08, "loss": 1.1537, "step": 31435 }, { "epoch": 0.95, "learning_rate": 3.67274203656065e-08, "loss": 1.1943, "step": 31436 }, { "epoch": 0.95, "learning_rate": 3.6685775207784547e-08, "loss": 1.0862, "step": 31437 }, { "epoch": 0.95, "learning_rate": 3.66441534995271e-08, "loss": 1.0281, "step": 31438 }, { "epoch": 0.95, "learning_rate": 3.660255524123135e-08, "loss": 1.0544, "step": 31439 }, { "epoch": 0.95, "learning_rate": 3.6560980433292537e-08, "loss": 1.0928, "step": 31440 }, { "epoch": 0.95, "learning_rate": 3.651942907610701e-08, "loss": 1.1208, "step": 31441 }, { "epoch": 0.95, "learning_rate": 3.647790117007e-08, "loss": 1.1169, "step": 31442 }, { "epoch": 0.95, "learning_rate": 3.643639671557675e-08, "loss": 1.1985, "step": 31443 }, { "epoch": 0.95, "learning_rate": 3.639491571302251e-08, "loss": 1.1608, "step": 31444 }, { "epoch": 0.95, "learning_rate": 3.635345816280222e-08, "loss": 1.1265, "step": 31445 }, { "epoch": 0.95, "learning_rate": 3.631202406531087e-08, "loss": 0.9989, "step": 31446 }, { "epoch": 0.95, "learning_rate": 3.6270613420942016e-08, "loss": 1.0878, "step": 31447 }, { "epoch": 0.95, "learning_rate": 3.6229226230090345e-08, "loss": 0.9052, "step": 31448 }, { "epoch": 0.95, "learning_rate": 3.618786249314998e-08, "loss": 1.1171, "step": 31449 }, { "epoch": 0.95, "learning_rate": 3.614652221051479e-08, "loss": 1.1998, "step": 31450 }, { "epoch": 0.95, "learning_rate": 3.610520538257778e-08, "loss": 1.0989, "step": 31451 }, { "epoch": 0.95, "learning_rate": 3.6063912009732524e-08, "loss": 1.0605, "step": 31452 }, { "epoch": 0.95, "learning_rate": 3.602264209237233e-08, "loss": 1.0717, "step": 31453 }, { "epoch": 0.95, "learning_rate": 3.598139563088965e-08, "loss": 1.0312, "step": 31454 }, { "epoch": 0.95, "learning_rate": 3.594017262567751e-08, "loss": 1.2422, "step": 31455 }, { "epoch": 0.95, "learning_rate": 3.589897307712836e-08, "loss": 1.1844, "step": 31456 }, { "epoch": 0.95, "learning_rate": 3.585779698563413e-08, "loss": 1.0809, "step": 31457 }, { "epoch": 0.95, "learning_rate": 3.5816644351586715e-08, "loss": 1.0884, "step": 31458 }, { "epoch": 0.95, "learning_rate": 3.577551517537831e-08, "loss": 1.0977, "step": 31459 }, { "epoch": 0.95, "learning_rate": 3.573440945739998e-08, "loss": 1.1385, "step": 31460 }, { "epoch": 0.95, "learning_rate": 3.569332719804336e-08, "loss": 1.1343, "step": 31461 }, { "epoch": 0.95, "learning_rate": 3.5652268397699253e-08, "loss": 1.0176, "step": 31462 }, { "epoch": 0.95, "learning_rate": 3.561123305675901e-08, "loss": 1.126, "step": 31463 }, { "epoch": 0.95, "learning_rate": 3.5570221175612874e-08, "loss": 1.1039, "step": 31464 }, { "epoch": 0.95, "learning_rate": 3.552923275465109e-08, "loss": 0.976, "step": 31465 }, { "epoch": 0.95, "learning_rate": 3.5488267794264173e-08, "loss": 1.1548, "step": 31466 }, { "epoch": 0.95, "learning_rate": 3.54473262948421e-08, "loss": 1.0455, "step": 31467 }, { "epoch": 0.95, "learning_rate": 3.540640825677455e-08, "loss": 1.1624, "step": 31468 }, { "epoch": 0.95, "learning_rate": 3.536551368045066e-08, "loss": 1.2686, "step": 31469 }, { "epoch": 0.95, "learning_rate": 3.532464256626039e-08, "loss": 0.9628, "step": 31470 }, { "epoch": 0.95, "learning_rate": 3.528379491459233e-08, "loss": 1.0821, "step": 31471 }, { "epoch": 0.95, "learning_rate": 3.52429707258356e-08, "loss": 1.0558, "step": 31472 }, { "epoch": 0.95, "learning_rate": 3.520217000037879e-08, "loss": 1.0612, "step": 31473 }, { "epoch": 0.95, "learning_rate": 3.516139273860991e-08, "loss": 1.1641, "step": 31474 }, { "epoch": 0.95, "learning_rate": 3.5120638940917825e-08, "loss": 1.1937, "step": 31475 }, { "epoch": 0.95, "learning_rate": 3.507990860769001e-08, "loss": 1.1295, "step": 31476 }, { "epoch": 0.95, "learning_rate": 3.5039201739314465e-08, "loss": 1.1244, "step": 31477 }, { "epoch": 0.95, "learning_rate": 3.4998518336178125e-08, "loss": 1.121, "step": 31478 }, { "epoch": 0.95, "learning_rate": 3.4957858398668996e-08, "loss": 1.1971, "step": 31479 }, { "epoch": 0.95, "learning_rate": 3.4917221927174005e-08, "loss": 1.1301, "step": 31480 }, { "epoch": 0.95, "learning_rate": 3.48766089220795e-08, "loss": 1.1052, "step": 31481 }, { "epoch": 0.95, "learning_rate": 3.483601938377268e-08, "loss": 1.0472, "step": 31482 }, { "epoch": 0.95, "learning_rate": 3.479545331263961e-08, "loss": 1.0968, "step": 31483 }, { "epoch": 0.95, "learning_rate": 3.4754910709066395e-08, "loss": 1.0298, "step": 31484 }, { "epoch": 0.95, "learning_rate": 3.4714391573439364e-08, "loss": 1.1024, "step": 31485 }, { "epoch": 0.95, "learning_rate": 3.467389590614378e-08, "loss": 1.0484, "step": 31486 }, { "epoch": 0.95, "learning_rate": 3.463342370756545e-08, "loss": 1.2637, "step": 31487 }, { "epoch": 0.95, "learning_rate": 3.459297497808961e-08, "loss": 1.1083, "step": 31488 }, { "epoch": 0.95, "learning_rate": 3.4552549718101235e-08, "loss": 1.1856, "step": 31489 }, { "epoch": 0.95, "learning_rate": 3.45121479279853e-08, "loss": 1.145, "step": 31490 }, { "epoch": 0.95, "learning_rate": 3.44717696081262e-08, "loss": 0.9855, "step": 31491 }, { "epoch": 0.95, "learning_rate": 3.443141475890838e-08, "loss": 1.1926, "step": 31492 }, { "epoch": 0.95, "learning_rate": 3.4391083380716226e-08, "loss": 1.1484, "step": 31493 }, { "epoch": 0.95, "learning_rate": 3.435077547393334e-08, "loss": 1.0171, "step": 31494 }, { "epoch": 0.95, "learning_rate": 3.4310491038943295e-08, "loss": 1.1702, "step": 31495 }, { "epoch": 0.95, "learning_rate": 3.427023007613023e-08, "loss": 1.0646, "step": 31496 }, { "epoch": 0.95, "learning_rate": 3.4229992585876894e-08, "loss": 1.0496, "step": 31497 }, { "epoch": 0.95, "learning_rate": 3.418977856856659e-08, "loss": 1.2072, "step": 31498 }, { "epoch": 0.95, "learning_rate": 3.4149588024581795e-08, "loss": 1.1514, "step": 31499 }, { "epoch": 0.95, "learning_rate": 3.410942095430553e-08, "loss": 1.1168, "step": 31500 }, { "epoch": 0.95, "learning_rate": 3.406927735811999e-08, "loss": 1.1107, "step": 31501 }, { "epoch": 0.95, "learning_rate": 3.402915723640737e-08, "loss": 1.0904, "step": 31502 }, { "epoch": 0.95, "learning_rate": 3.398906058954932e-08, "loss": 1.0551, "step": 31503 }, { "epoch": 0.95, "learning_rate": 3.394898741792774e-08, "loss": 1.1683, "step": 31504 }, { "epoch": 0.95, "learning_rate": 3.3908937721923996e-08, "loss": 1.0784, "step": 31505 }, { "epoch": 0.95, "learning_rate": 3.3868911501919734e-08, "loss": 1.1148, "step": 31506 }, { "epoch": 0.95, "learning_rate": 3.382890875829575e-08, "loss": 0.9568, "step": 31507 }, { "epoch": 0.95, "learning_rate": 3.378892949143259e-08, "loss": 1.1003, "step": 31508 }, { "epoch": 0.95, "learning_rate": 3.374897370171104e-08, "loss": 1.0888, "step": 31509 }, { "epoch": 0.95, "learning_rate": 3.370904138951137e-08, "loss": 1.0776, "step": 31510 }, { "epoch": 0.95, "learning_rate": 3.366913255521409e-08, "loss": 1.0456, "step": 31511 }, { "epoch": 0.95, "learning_rate": 3.3629247199198636e-08, "loss": 1.1575, "step": 31512 }, { "epoch": 0.95, "learning_rate": 3.358938532184497e-08, "loss": 1.0754, "step": 31513 }, { "epoch": 0.95, "learning_rate": 3.3549546923532516e-08, "loss": 1.129, "step": 31514 }, { "epoch": 0.95, "learning_rate": 3.3509732004640696e-08, "loss": 1.1734, "step": 31515 }, { "epoch": 0.95, "learning_rate": 3.3469940565548085e-08, "loss": 0.99, "step": 31516 }, { "epoch": 0.95, "learning_rate": 3.343017260663356e-08, "loss": 1.1145, "step": 31517 }, { "epoch": 0.95, "learning_rate": 3.3390428128275974e-08, "loss": 1.0988, "step": 31518 }, { "epoch": 0.95, "learning_rate": 3.335070713085392e-08, "loss": 1.0905, "step": 31519 }, { "epoch": 0.95, "learning_rate": 3.3311009614744874e-08, "loss": 1.0893, "step": 31520 }, { "epoch": 0.95, "learning_rate": 3.327133558032686e-08, "loss": 1.1277, "step": 31521 }, { "epoch": 0.95, "learning_rate": 3.3231685027977913e-08, "loss": 1.0746, "step": 31522 }, { "epoch": 0.95, "learning_rate": 3.319205795807523e-08, "loss": 1.0671, "step": 31523 }, { "epoch": 0.95, "learning_rate": 3.315245437099629e-08, "loss": 1.2902, "step": 31524 }, { "epoch": 0.95, "learning_rate": 3.3112874267117736e-08, "loss": 1.2043, "step": 31525 }, { "epoch": 0.95, "learning_rate": 3.307331764681648e-08, "loss": 1.1623, "step": 31526 }, { "epoch": 0.95, "learning_rate": 3.303378451046918e-08, "loss": 1.0027, "step": 31527 }, { "epoch": 0.95, "learning_rate": 3.2994274858452194e-08, "loss": 1.0967, "step": 31528 }, { "epoch": 0.95, "learning_rate": 3.295478869114133e-08, "loss": 1.072, "step": 31529 }, { "epoch": 0.95, "learning_rate": 3.291532600891295e-08, "loss": 1.0264, "step": 31530 }, { "epoch": 0.95, "learning_rate": 3.287588681214232e-08, "loss": 1.1513, "step": 31531 }, { "epoch": 0.95, "learning_rate": 3.283647110120525e-08, "loss": 1.0728, "step": 31532 }, { "epoch": 0.95, "learning_rate": 3.279707887647643e-08, "loss": 1.1151, "step": 31533 }, { "epoch": 0.95, "learning_rate": 3.27577101383314e-08, "loss": 1.1074, "step": 31534 }, { "epoch": 0.95, "learning_rate": 3.271836488714458e-08, "loss": 1.0071, "step": 31535 }, { "epoch": 0.95, "learning_rate": 3.2679043123290676e-08, "loss": 1.1661, "step": 31536 }, { "epoch": 0.95, "learning_rate": 3.2639744847144105e-08, "loss": 1.0304, "step": 31537 }, { "epoch": 0.95, "learning_rate": 3.260047005907874e-08, "loss": 1.144, "step": 31538 }, { "epoch": 0.95, "learning_rate": 3.256121875946844e-08, "loss": 1.188, "step": 31539 }, { "epoch": 0.95, "learning_rate": 3.2521990948687074e-08, "loss": 1.0489, "step": 31540 }, { "epoch": 0.95, "learning_rate": 3.2482786627108246e-08, "loss": 1.0306, "step": 31541 }, { "epoch": 0.95, "learning_rate": 3.2443605795104414e-08, "loss": 1.108, "step": 31542 }, { "epoch": 0.95, "learning_rate": 3.2404448453049185e-08, "loss": 1.0966, "step": 31543 }, { "epoch": 0.95, "learning_rate": 3.236531460131531e-08, "loss": 0.9435, "step": 31544 }, { "epoch": 0.95, "learning_rate": 3.2326204240275275e-08, "loss": 1.0588, "step": 31545 }, { "epoch": 0.95, "learning_rate": 3.228711737030127e-08, "loss": 1.0668, "step": 31546 }, { "epoch": 0.95, "learning_rate": 3.224805399176523e-08, "loss": 1.0993, "step": 31547 }, { "epoch": 0.95, "learning_rate": 3.220901410503935e-08, "loss": 1.1986, "step": 31548 }, { "epoch": 0.95, "learning_rate": 3.2169997710495007e-08, "loss": 1.0876, "step": 31549 }, { "epoch": 0.95, "learning_rate": 3.213100480850384e-08, "loss": 1.0823, "step": 31550 }, { "epoch": 0.95, "learning_rate": 3.209203539943695e-08, "loss": 1.1413, "step": 31551 }, { "epoch": 0.95, "learning_rate": 3.2053089483665145e-08, "loss": 1.1374, "step": 31552 }, { "epoch": 0.95, "learning_rate": 3.201416706155952e-08, "loss": 1.0918, "step": 31553 }, { "epoch": 0.95, "learning_rate": 3.1975268133490334e-08, "loss": 1.1027, "step": 31554 }, { "epoch": 0.95, "learning_rate": 3.193639269982785e-08, "loss": 1.1232, "step": 31555 }, { "epoch": 0.95, "learning_rate": 3.1897540760942316e-08, "loss": 1.1776, "step": 31556 }, { "epoch": 0.95, "learning_rate": 3.1858712317203445e-08, "loss": 1.0901, "step": 31557 }, { "epoch": 0.95, "learning_rate": 3.181990736898122e-08, "loss": 1.0369, "step": 31558 }, { "epoch": 0.95, "learning_rate": 3.1781125916644506e-08, "loss": 1.1297, "step": 31559 }, { "epoch": 0.95, "learning_rate": 3.1742367960562734e-08, "loss": 1.1437, "step": 31560 }, { "epoch": 0.95, "learning_rate": 3.170363350110506e-08, "loss": 1.1476, "step": 31561 }, { "epoch": 0.95, "learning_rate": 3.1664922538639786e-08, "loss": 1.1649, "step": 31562 }, { "epoch": 0.95, "learning_rate": 3.1626235073535794e-08, "loss": 1.1917, "step": 31563 }, { "epoch": 0.95, "learning_rate": 3.158757110616112e-08, "loss": 1.0338, "step": 31564 }, { "epoch": 0.95, "learning_rate": 3.154893063688408e-08, "loss": 1.0951, "step": 31565 }, { "epoch": 0.95, "learning_rate": 3.151031366607243e-08, "loss": 1.0902, "step": 31566 }, { "epoch": 0.95, "learning_rate": 3.1471720194093393e-08, "loss": 1.0631, "step": 31567 }, { "epoch": 0.95, "learning_rate": 3.143315022131499e-08, "loss": 1.1923, "step": 31568 }, { "epoch": 0.95, "learning_rate": 3.139460374810388e-08, "loss": 1.1141, "step": 31569 }, { "epoch": 0.95, "learning_rate": 3.135608077482727e-08, "loss": 1.0709, "step": 31570 }, { "epoch": 0.95, "learning_rate": 3.131758130185209e-08, "loss": 1.0577, "step": 31571 }, { "epoch": 0.95, "learning_rate": 3.1279105329544424e-08, "loss": 1.1088, "step": 31572 }, { "epoch": 0.95, "learning_rate": 3.124065285827066e-08, "loss": 1.0387, "step": 31573 }, { "epoch": 0.95, "learning_rate": 3.120222388839689e-08, "loss": 1.1251, "step": 31574 }, { "epoch": 0.95, "learning_rate": 3.116381842028893e-08, "loss": 1.1627, "step": 31575 }, { "epoch": 0.95, "learning_rate": 3.1125436454312596e-08, "loss": 1.0859, "step": 31576 }, { "epoch": 0.95, "learning_rate": 3.1087077990832884e-08, "loss": 1.0309, "step": 31577 }, { "epoch": 0.95, "learning_rate": 3.1048743030215045e-08, "loss": 1.0637, "step": 31578 }, { "epoch": 0.95, "learning_rate": 3.1010431572824076e-08, "loss": 1.172, "step": 31579 }, { "epoch": 0.95, "learning_rate": 3.097214361902495e-08, "loss": 0.9759, "step": 31580 }, { "epoch": 0.95, "learning_rate": 3.093387916918156e-08, "loss": 1.1745, "step": 31581 }, { "epoch": 0.95, "learning_rate": 3.08956382236586e-08, "loss": 1.0676, "step": 31582 }, { "epoch": 0.95, "learning_rate": 3.0857420782819946e-08, "loss": 1.0638, "step": 31583 }, { "epoch": 0.95, "learning_rate": 3.0819226847029756e-08, "loss": 1.1385, "step": 31584 }, { "epoch": 0.95, "learning_rate": 3.078105641665108e-08, "loss": 1.0262, "step": 31585 }, { "epoch": 0.95, "learning_rate": 3.07429094920475e-08, "loss": 1.0513, "step": 31586 }, { "epoch": 0.95, "learning_rate": 3.070478607358235e-08, "loss": 1.2334, "step": 31587 }, { "epoch": 0.95, "learning_rate": 3.0666686161618385e-08, "loss": 1.1061, "step": 31588 }, { "epoch": 0.95, "learning_rate": 3.062860975651838e-08, "loss": 1.0944, "step": 31589 }, { "epoch": 0.95, "learning_rate": 3.0590556858644535e-08, "loss": 0.9818, "step": 31590 }, { "epoch": 0.95, "learning_rate": 3.055252746835907e-08, "loss": 1.1486, "step": 31591 }, { "epoch": 0.95, "learning_rate": 3.051452158602447e-08, "loss": 1.2701, "step": 31592 }, { "epoch": 0.95, "learning_rate": 3.047653921200211e-08, "loss": 1.1021, "step": 31593 }, { "epoch": 0.95, "learning_rate": 3.043858034665392e-08, "loss": 1.0496, "step": 31594 }, { "epoch": 0.95, "learning_rate": 3.040064499034101e-08, "loss": 1.1465, "step": 31595 }, { "epoch": 0.95, "learning_rate": 3.036273314342447e-08, "loss": 1.1174, "step": 31596 }, { "epoch": 0.95, "learning_rate": 3.032484480626569e-08, "loss": 1.1791, "step": 31597 }, { "epoch": 0.95, "learning_rate": 3.028697997922464e-08, "loss": 1.063, "step": 31598 }, { "epoch": 0.95, "learning_rate": 3.024913866266216e-08, "loss": 1.1036, "step": 31599 }, { "epoch": 0.95, "learning_rate": 3.021132085693823e-08, "loss": 1.0618, "step": 31600 }, { "epoch": 0.95, "learning_rate": 3.0173526562413125e-08, "loss": 1.0566, "step": 31601 }, { "epoch": 0.95, "learning_rate": 3.013575577944655e-08, "loss": 1.1265, "step": 31602 }, { "epoch": 0.95, "learning_rate": 3.0098008508398226e-08, "loss": 1.1, "step": 31603 }, { "epoch": 0.95, "learning_rate": 3.006028474962702e-08, "loss": 1.1471, "step": 31604 }, { "epoch": 0.95, "learning_rate": 3.002258450349238e-08, "loss": 1.0576, "step": 31605 }, { "epoch": 0.95, "learning_rate": 2.998490777035346e-08, "loss": 1.1082, "step": 31606 }, { "epoch": 0.95, "learning_rate": 2.99472545505683e-08, "loss": 1.0843, "step": 31607 }, { "epoch": 0.95, "learning_rate": 2.990962484449578e-08, "loss": 1.1512, "step": 31608 }, { "epoch": 0.95, "learning_rate": 2.987201865249395e-08, "loss": 1.038, "step": 31609 }, { "epoch": 0.95, "learning_rate": 2.9834435974921136e-08, "loss": 1.1807, "step": 31610 }, { "epoch": 0.95, "learning_rate": 2.9796876812134557e-08, "loss": 1.089, "step": 31611 }, { "epoch": 0.95, "learning_rate": 2.9759341164491973e-08, "loss": 1.0756, "step": 31612 }, { "epoch": 0.95, "learning_rate": 2.9721829032350602e-08, "loss": 1.1522, "step": 31613 }, { "epoch": 0.95, "learning_rate": 2.9684340416067936e-08, "loss": 1.1628, "step": 31614 }, { "epoch": 0.95, "learning_rate": 2.964687531600091e-08, "loss": 1.0606, "step": 31615 }, { "epoch": 0.95, "learning_rate": 2.9609433732505354e-08, "loss": 1.0796, "step": 31616 }, { "epoch": 0.95, "learning_rate": 2.957201566593848e-08, "loss": 1.1301, "step": 31617 }, { "epoch": 0.95, "learning_rate": 2.9534621116655837e-08, "loss": 1.1014, "step": 31618 }, { "epoch": 0.95, "learning_rate": 2.9497250085014083e-08, "loss": 1.1918, "step": 31619 }, { "epoch": 0.95, "learning_rate": 2.945990257136877e-08, "loss": 1.2373, "step": 31620 }, { "epoch": 0.95, "learning_rate": 2.9422578576075167e-08, "loss": 1.1245, "step": 31621 }, { "epoch": 0.95, "learning_rate": 2.9385278099488825e-08, "loss": 1.0057, "step": 31622 }, { "epoch": 0.95, "learning_rate": 2.9348001141964733e-08, "loss": 1.0936, "step": 31623 }, { "epoch": 0.95, "learning_rate": 2.931074770385761e-08, "loss": 1.0774, "step": 31624 }, { "epoch": 0.95, "learning_rate": 2.9273517785522453e-08, "loss": 1.0558, "step": 31625 }, { "epoch": 0.95, "learning_rate": 2.923631138731342e-08, "loss": 1.1724, "step": 31626 }, { "epoch": 0.95, "learning_rate": 2.9199128509584673e-08, "loss": 1.1647, "step": 31627 }, { "epoch": 0.95, "learning_rate": 2.916196915269037e-08, "loss": 1.0874, "step": 31628 }, { "epoch": 0.95, "learning_rate": 2.9124833316984125e-08, "loss": 1.1579, "step": 31629 }, { "epoch": 0.95, "learning_rate": 2.908772100281926e-08, "loss": 1.1281, "step": 31630 }, { "epoch": 0.95, "learning_rate": 2.905063221054938e-08, "loss": 1.0004, "step": 31631 }, { "epoch": 0.95, "learning_rate": 2.901356694052754e-08, "loss": 1.0513, "step": 31632 }, { "epoch": 0.95, "learning_rate": 2.897652519310623e-08, "loss": 1.1047, "step": 31633 }, { "epoch": 0.95, "learning_rate": 2.8939506968638507e-08, "loss": 1.0131, "step": 31634 }, { "epoch": 0.95, "learning_rate": 2.8902512267476313e-08, "loss": 1.0767, "step": 31635 }, { "epoch": 0.95, "learning_rate": 2.8865541089972416e-08, "loss": 1.0568, "step": 31636 }, { "epoch": 0.95, "learning_rate": 2.8828593436478204e-08, "loss": 1.244, "step": 31637 }, { "epoch": 0.95, "learning_rate": 2.8791669307345893e-08, "loss": 1.1074, "step": 31638 }, { "epoch": 0.95, "learning_rate": 2.8754768702926316e-08, "loss": 1.0723, "step": 31639 }, { "epoch": 0.95, "learning_rate": 2.8717891623571413e-08, "loss": 1.1467, "step": 31640 }, { "epoch": 0.95, "learning_rate": 2.8681038069632017e-08, "loss": 1.0777, "step": 31641 }, { "epoch": 0.95, "learning_rate": 2.8644208041458678e-08, "loss": 1.0977, "step": 31642 }, { "epoch": 0.95, "learning_rate": 2.86074015394025e-08, "loss": 1.0938, "step": 31643 }, { "epoch": 0.95, "learning_rate": 2.857061856381349e-08, "loss": 1.2059, "step": 31644 }, { "epoch": 0.95, "learning_rate": 2.8533859115041918e-08, "loss": 1.1918, "step": 31645 }, { "epoch": 0.95, "learning_rate": 2.8497123193437503e-08, "loss": 1.0439, "step": 31646 }, { "epoch": 0.95, "learning_rate": 2.8460410799350524e-08, "loss": 1.0013, "step": 31647 }, { "epoch": 0.95, "learning_rate": 2.8423721933129867e-08, "loss": 1.059, "step": 31648 }, { "epoch": 0.95, "learning_rate": 2.8387056595124974e-08, "loss": 1.1011, "step": 31649 }, { "epoch": 0.95, "learning_rate": 2.835041478568501e-08, "loss": 1.1841, "step": 31650 }, { "epoch": 0.95, "learning_rate": 2.8313796505158587e-08, "loss": 1.0979, "step": 31651 }, { "epoch": 0.95, "learning_rate": 2.827720175389459e-08, "loss": 0.9609, "step": 31652 }, { "epoch": 0.95, "learning_rate": 2.8240630532241354e-08, "loss": 1.1073, "step": 31653 }, { "epoch": 0.95, "learning_rate": 2.8204082840546655e-08, "loss": 1.1108, "step": 31654 }, { "epoch": 0.95, "learning_rate": 2.8167558679158547e-08, "loss": 1.1296, "step": 31655 }, { "epoch": 0.95, "learning_rate": 2.8131058048424808e-08, "loss": 1.1682, "step": 31656 }, { "epoch": 0.95, "learning_rate": 2.809458094869294e-08, "loss": 1.1203, "step": 31657 }, { "epoch": 0.95, "learning_rate": 2.805812738031044e-08, "loss": 1.0108, "step": 31658 }, { "epoch": 0.95, "learning_rate": 2.8021697343623976e-08, "loss": 1.0049, "step": 31659 }, { "epoch": 0.95, "learning_rate": 2.7985290838980217e-08, "loss": 1.1871, "step": 31660 }, { "epoch": 0.95, "learning_rate": 2.7948907866725826e-08, "loss": 1.0908, "step": 31661 }, { "epoch": 0.95, "learning_rate": 2.7912548427207474e-08, "loss": 1.0544, "step": 31662 }, { "epoch": 0.95, "learning_rate": 2.7876212520770996e-08, "loss": 1.2231, "step": 31663 }, { "epoch": 0.95, "learning_rate": 2.7839900147762222e-08, "loss": 1.0737, "step": 31664 }, { "epoch": 0.95, "learning_rate": 2.7803611308527268e-08, "loss": 1.1772, "step": 31665 }, { "epoch": 0.95, "learning_rate": 2.776734600341113e-08, "loss": 1.0494, "step": 31666 }, { "epoch": 0.95, "learning_rate": 2.7731104232759097e-08, "loss": 1.1582, "step": 31667 }, { "epoch": 0.95, "learning_rate": 2.7694885996916444e-08, "loss": 1.1364, "step": 31668 }, { "epoch": 0.95, "learning_rate": 2.7658691296227612e-08, "loss": 1.0491, "step": 31669 }, { "epoch": 0.95, "learning_rate": 2.7622520131037335e-08, "loss": 1.0371, "step": 31670 }, { "epoch": 0.95, "learning_rate": 2.758637250169005e-08, "loss": 1.0009, "step": 31671 }, { "epoch": 0.95, "learning_rate": 2.7550248408529656e-08, "loss": 1.0231, "step": 31672 }, { "epoch": 0.95, "learning_rate": 2.7514147851900043e-08, "loss": 1.161, "step": 31673 }, { "epoch": 0.95, "learning_rate": 2.7478070832145098e-08, "loss": 1.1445, "step": 31674 }, { "epoch": 0.95, "learning_rate": 2.7442017349607887e-08, "loss": 1.0769, "step": 31675 }, { "epoch": 0.95, "learning_rate": 2.7405987404632016e-08, "loss": 1.0546, "step": 31676 }, { "epoch": 0.95, "learning_rate": 2.7369980997560274e-08, "loss": 1.0065, "step": 31677 }, { "epoch": 0.95, "learning_rate": 2.733399812873544e-08, "loss": 1.0503, "step": 31678 }, { "epoch": 0.95, "learning_rate": 2.729803879850029e-08, "loss": 1.0737, "step": 31679 }, { "epoch": 0.95, "learning_rate": 2.7262103007196507e-08, "loss": 1.1865, "step": 31680 }, { "epoch": 0.95, "learning_rate": 2.722619075516686e-08, "loss": 1.183, "step": 31681 }, { "epoch": 0.95, "learning_rate": 2.7190302042753026e-08, "loss": 1.0958, "step": 31682 }, { "epoch": 0.95, "learning_rate": 2.7154436870296396e-08, "loss": 1.0705, "step": 31683 }, { "epoch": 0.95, "learning_rate": 2.7118595238138644e-08, "loss": 1.2155, "step": 31684 }, { "epoch": 0.95, "learning_rate": 2.7082777146620887e-08, "loss": 1.0048, "step": 31685 }, { "epoch": 0.95, "learning_rate": 2.704698259608396e-08, "loss": 1.0698, "step": 31686 }, { "epoch": 0.95, "learning_rate": 2.701121158686898e-08, "loss": 1.2202, "step": 31687 }, { "epoch": 0.95, "learning_rate": 2.697546411931623e-08, "loss": 1.1172, "step": 31688 }, { "epoch": 0.95, "learning_rate": 2.6939740193765717e-08, "loss": 1.0899, "step": 31689 }, { "epoch": 0.95, "learning_rate": 2.6904039810558e-08, "loss": 1.1354, "step": 31690 }, { "epoch": 0.95, "learning_rate": 2.6868362970032536e-08, "loss": 1.0944, "step": 31691 }, { "epoch": 0.95, "learning_rate": 2.68327096725296e-08, "loss": 1.139, "step": 31692 }, { "epoch": 0.95, "learning_rate": 2.6797079918387814e-08, "loss": 1.0884, "step": 31693 }, { "epoch": 0.95, "learning_rate": 2.676147370794663e-08, "loss": 1.0737, "step": 31694 }, { "epoch": 0.95, "learning_rate": 2.6725891041545215e-08, "loss": 1.1564, "step": 31695 }, { "epoch": 0.95, "learning_rate": 2.6690331919522195e-08, "loss": 1.0555, "step": 31696 }, { "epoch": 0.95, "learning_rate": 2.6654796342215906e-08, "loss": 0.9927, "step": 31697 }, { "epoch": 0.95, "learning_rate": 2.6619284309964967e-08, "loss": 1.1092, "step": 31698 }, { "epoch": 0.95, "learning_rate": 2.6583795823106883e-08, "loss": 1.0738, "step": 31699 }, { "epoch": 0.95, "learning_rate": 2.654833088198e-08, "loss": 0.8464, "step": 31700 }, { "epoch": 0.95, "learning_rate": 2.651288948692182e-08, "loss": 1.0446, "step": 31701 }, { "epoch": 0.96, "learning_rate": 2.647747163826958e-08, "loss": 1.0563, "step": 31702 }, { "epoch": 0.96, "learning_rate": 2.6442077336360507e-08, "loss": 1.0753, "step": 31703 }, { "epoch": 0.96, "learning_rate": 2.640670658153155e-08, "loss": 1.025, "step": 31704 }, { "epoch": 0.96, "learning_rate": 2.637135937411939e-08, "loss": 1.0263, "step": 31705 }, { "epoch": 0.96, "learning_rate": 2.6336035714460694e-08, "loss": 1.2407, "step": 31706 }, { "epoch": 0.96, "learning_rate": 2.6300735602891592e-08, "loss": 1.0504, "step": 31707 }, { "epoch": 0.96, "learning_rate": 2.626545903974792e-08, "loss": 1.095, "step": 31708 }, { "epoch": 0.96, "learning_rate": 2.62302060253658e-08, "loss": 1.0777, "step": 31709 }, { "epoch": 0.96, "learning_rate": 2.61949765600808e-08, "loss": 1.0698, "step": 31710 }, { "epoch": 0.96, "learning_rate": 2.615977064422792e-08, "loss": 1.0461, "step": 31711 }, { "epoch": 0.96, "learning_rate": 2.612458827814274e-08, "loss": 1.0748, "step": 31712 }, { "epoch": 0.96, "learning_rate": 2.6089429462159977e-08, "loss": 1.1604, "step": 31713 }, { "epoch": 0.96, "learning_rate": 2.6054294196614648e-08, "loss": 0.982, "step": 31714 }, { "epoch": 0.96, "learning_rate": 2.6019182481840656e-08, "loss": 1.0074, "step": 31715 }, { "epoch": 0.96, "learning_rate": 2.5984094318172726e-08, "loss": 1.1023, "step": 31716 }, { "epoch": 0.96, "learning_rate": 2.5949029705944485e-08, "loss": 1.0792, "step": 31717 }, { "epoch": 0.96, "learning_rate": 2.5913988645490106e-08, "loss": 1.0964, "step": 31718 }, { "epoch": 0.96, "learning_rate": 2.587897113714294e-08, "loss": 1.1261, "step": 31719 }, { "epoch": 0.96, "learning_rate": 2.5843977181236323e-08, "loss": 1.061, "step": 31720 }, { "epoch": 0.96, "learning_rate": 2.580900677810333e-08, "loss": 1.0582, "step": 31721 }, { "epoch": 0.96, "learning_rate": 2.5774059928077022e-08, "loss": 0.9902, "step": 31722 }, { "epoch": 0.96, "learning_rate": 2.573913663149047e-08, "loss": 1.0526, "step": 31723 }, { "epoch": 0.96, "learning_rate": 2.570423688867535e-08, "loss": 1.2159, "step": 31724 }, { "epoch": 0.96, "learning_rate": 2.5669360699964174e-08, "loss": 1.1601, "step": 31725 }, { "epoch": 0.96, "learning_rate": 2.56345080656889e-08, "loss": 1.0591, "step": 31726 }, { "epoch": 0.96, "learning_rate": 2.5599678986181764e-08, "loss": 1.0803, "step": 31727 }, { "epoch": 0.96, "learning_rate": 2.5564873461773888e-08, "loss": 0.9761, "step": 31728 }, { "epoch": 0.96, "learning_rate": 2.5530091492796672e-08, "loss": 1.0788, "step": 31729 }, { "epoch": 0.96, "learning_rate": 2.5495333079580963e-08, "loss": 1.0491, "step": 31730 }, { "epoch": 0.96, "learning_rate": 2.5460598222458165e-08, "loss": 1.1404, "step": 31731 }, { "epoch": 0.96, "learning_rate": 2.542588692175857e-08, "loss": 1.1196, "step": 31732 }, { "epoch": 0.96, "learning_rate": 2.539119917781302e-08, "loss": 1.0057, "step": 31733 }, { "epoch": 0.96, "learning_rate": 2.5356534990950976e-08, "loss": 1.0253, "step": 31734 }, { "epoch": 0.96, "learning_rate": 2.5321894361503285e-08, "loss": 1.0493, "step": 31735 }, { "epoch": 0.96, "learning_rate": 2.5287277289799405e-08, "loss": 1.0596, "step": 31736 }, { "epoch": 0.96, "learning_rate": 2.525268377616852e-08, "loss": 1.1375, "step": 31737 }, { "epoch": 0.96, "learning_rate": 2.521811382094008e-08, "loss": 1.0651, "step": 31738 }, { "epoch": 0.96, "learning_rate": 2.5183567424443554e-08, "loss": 1.0018, "step": 31739 }, { "epoch": 0.96, "learning_rate": 2.5149044587007564e-08, "loss": 0.9858, "step": 31740 }, { "epoch": 0.96, "learning_rate": 2.511454530896046e-08, "loss": 1.0278, "step": 31741 }, { "epoch": 0.96, "learning_rate": 2.508006959063114e-08, "loss": 1.1755, "step": 31742 }, { "epoch": 0.96, "learning_rate": 2.504561743234768e-08, "loss": 1.0969, "step": 31743 }, { "epoch": 0.96, "learning_rate": 2.501118883443787e-08, "loss": 1.0486, "step": 31744 }, { "epoch": 0.96, "learning_rate": 2.497678379722951e-08, "loss": 1.09, "step": 31745 }, { "epoch": 0.96, "learning_rate": 2.4942402321050384e-08, "loss": 1.0377, "step": 31746 }, { "epoch": 0.96, "learning_rate": 2.4908044406227182e-08, "loss": 1.1124, "step": 31747 }, { "epoch": 0.96, "learning_rate": 2.4873710053087418e-08, "loss": 1.0762, "step": 31748 }, { "epoch": 0.96, "learning_rate": 2.483939926195833e-08, "loss": 1.0595, "step": 31749 }, { "epoch": 0.96, "learning_rate": 2.480511203316577e-08, "loss": 0.9999, "step": 31750 }, { "epoch": 0.96, "learning_rate": 2.4770848367036136e-08, "loss": 1.1481, "step": 31751 }, { "epoch": 0.96, "learning_rate": 2.47366082638964e-08, "loss": 1.0366, "step": 31752 }, { "epoch": 0.96, "learning_rate": 2.4702391724071852e-08, "loss": 1.0785, "step": 31753 }, { "epoch": 0.96, "learning_rate": 2.466819874788834e-08, "loss": 1.1629, "step": 31754 }, { "epoch": 0.96, "learning_rate": 2.4634029335671438e-08, "loss": 1.1249, "step": 31755 }, { "epoch": 0.96, "learning_rate": 2.4599883487746447e-08, "loss": 1.1742, "step": 31756 }, { "epoch": 0.96, "learning_rate": 2.4565761204438098e-08, "loss": 1.1256, "step": 31757 }, { "epoch": 0.96, "learning_rate": 2.4531662486071695e-08, "loss": 1.1662, "step": 31758 }, { "epoch": 0.96, "learning_rate": 2.4497587332971695e-08, "loss": 1.177, "step": 31759 }, { "epoch": 0.96, "learning_rate": 2.4463535745462286e-08, "loss": 1.1479, "step": 31760 }, { "epoch": 0.96, "learning_rate": 2.442950772386793e-08, "loss": 1.0605, "step": 31761 }, { "epoch": 0.96, "learning_rate": 2.4395503268512534e-08, "loss": 1.1359, "step": 31762 }, { "epoch": 0.96, "learning_rate": 2.436152237971945e-08, "loss": 1.1656, "step": 31763 }, { "epoch": 0.96, "learning_rate": 2.4327565057812306e-08, "loss": 1.0228, "step": 31764 }, { "epoch": 0.96, "learning_rate": 2.4293631303114463e-08, "loss": 1.0923, "step": 31765 }, { "epoch": 0.96, "learning_rate": 2.4259721115948987e-08, "loss": 1.0938, "step": 31766 }, { "epoch": 0.96, "learning_rate": 2.42258344966384e-08, "loss": 0.996, "step": 31767 }, { "epoch": 0.96, "learning_rate": 2.4191971445505502e-08, "loss": 1.1548, "step": 31768 }, { "epoch": 0.96, "learning_rate": 2.415813196287281e-08, "loss": 1.1227, "step": 31769 }, { "epoch": 0.96, "learning_rate": 2.412431604906257e-08, "loss": 0.9696, "step": 31770 }, { "epoch": 0.96, "learning_rate": 2.4090523704395908e-08, "loss": 1.1255, "step": 31771 }, { "epoch": 0.96, "learning_rate": 2.4056754929195348e-08, "loss": 1.1639, "step": 31772 }, { "epoch": 0.96, "learning_rate": 2.402300972378174e-08, "loss": 1.098, "step": 31773 }, { "epoch": 0.96, "learning_rate": 2.398928808847678e-08, "loss": 1.0319, "step": 31774 }, { "epoch": 0.96, "learning_rate": 2.3955590023601317e-08, "loss": 1.0366, "step": 31775 }, { "epoch": 0.96, "learning_rate": 2.3921915529476203e-08, "loss": 1.0184, "step": 31776 }, { "epoch": 0.96, "learning_rate": 2.388826460642174e-08, "loss": 1.0647, "step": 31777 }, { "epoch": 0.96, "learning_rate": 2.3854637254758507e-08, "loss": 1.0486, "step": 31778 }, { "epoch": 0.96, "learning_rate": 2.38210334748068e-08, "loss": 1.089, "step": 31779 }, { "epoch": 0.96, "learning_rate": 2.3787453266886084e-08, "loss": 1.1443, "step": 31780 }, { "epoch": 0.96, "learning_rate": 2.375389663131611e-08, "loss": 1.0604, "step": 31781 }, { "epoch": 0.96, "learning_rate": 2.3720363568416616e-08, "loss": 1.0558, "step": 31782 }, { "epoch": 0.96, "learning_rate": 2.3686854078506516e-08, "loss": 1.0303, "step": 31783 }, { "epoch": 0.96, "learning_rate": 2.3653368161905e-08, "loss": 1.0609, "step": 31784 }, { "epoch": 0.96, "learning_rate": 2.3619905818930977e-08, "loss": 1.0045, "step": 31785 }, { "epoch": 0.96, "learning_rate": 2.358646704990253e-08, "loss": 1.1207, "step": 31786 }, { "epoch": 0.96, "learning_rate": 2.3553051855138287e-08, "loss": 1.1042, "step": 31787 }, { "epoch": 0.96, "learning_rate": 2.351966023495633e-08, "loss": 1.1028, "step": 31788 }, { "epoch": 0.96, "learning_rate": 2.3486292189674463e-08, "loss": 1.119, "step": 31789 }, { "epoch": 0.96, "learning_rate": 2.3452947719610487e-08, "loss": 1.0527, "step": 31790 }, { "epoch": 0.96, "learning_rate": 2.3419626825081642e-08, "loss": 1.1265, "step": 31791 }, { "epoch": 0.96, "learning_rate": 2.338632950640518e-08, "loss": 1.0846, "step": 31792 }, { "epoch": 0.96, "learning_rate": 2.3353055763898068e-08, "loss": 1.1589, "step": 31793 }, { "epoch": 0.96, "learning_rate": 2.3319805597877e-08, "loss": 1.1172, "step": 31794 }, { "epoch": 0.96, "learning_rate": 2.3286579008658662e-08, "loss": 1.0708, "step": 31795 }, { "epoch": 0.96, "learning_rate": 2.325337599655919e-08, "loss": 0.9686, "step": 31796 }, { "epoch": 0.96, "learning_rate": 2.3220196561894726e-08, "loss": 1.137, "step": 31797 }, { "epoch": 0.96, "learning_rate": 2.3187040704981122e-08, "loss": 1.0631, "step": 31798 }, { "epoch": 0.96, "learning_rate": 2.3153908426134243e-08, "loss": 1.04, "step": 31799 }, { "epoch": 0.96, "learning_rate": 2.3120799725669108e-08, "loss": 1.014, "step": 31800 }, { "epoch": 0.96, "learning_rate": 2.3087714603901023e-08, "loss": 1.1254, "step": 31801 }, { "epoch": 0.96, "learning_rate": 2.3054653061145014e-08, "loss": 0.9883, "step": 31802 }, { "epoch": 0.96, "learning_rate": 2.3021615097715556e-08, "loss": 1.1813, "step": 31803 }, { "epoch": 0.96, "learning_rate": 2.2988600713927665e-08, "loss": 1.0179, "step": 31804 }, { "epoch": 0.96, "learning_rate": 2.2955609910095267e-08, "loss": 1.1458, "step": 31805 }, { "epoch": 0.96, "learning_rate": 2.2922642686532546e-08, "loss": 1.024, "step": 31806 }, { "epoch": 0.96, "learning_rate": 2.288969904355315e-08, "loss": 1.1123, "step": 31807 }, { "epoch": 0.96, "learning_rate": 2.2856778981470707e-08, "loss": 1.0854, "step": 31808 }, { "epoch": 0.96, "learning_rate": 2.282388250059886e-08, "loss": 1.0739, "step": 31809 }, { "epoch": 0.96, "learning_rate": 2.2791009601250414e-08, "loss": 1.1544, "step": 31810 }, { "epoch": 0.96, "learning_rate": 2.275816028373873e-08, "loss": 1.1934, "step": 31811 }, { "epoch": 0.96, "learning_rate": 2.2725334548376056e-08, "loss": 1.0723, "step": 31812 }, { "epoch": 0.96, "learning_rate": 2.2692532395475196e-08, "loss": 1.0875, "step": 31813 }, { "epoch": 0.96, "learning_rate": 2.2659753825348407e-08, "loss": 1.106, "step": 31814 }, { "epoch": 0.96, "learning_rate": 2.262699883830738e-08, "loss": 1.0778, "step": 31815 }, { "epoch": 0.96, "learning_rate": 2.2594267434664363e-08, "loss": 1.1612, "step": 31816 }, { "epoch": 0.96, "learning_rate": 2.2561559614730775e-08, "loss": 1.0935, "step": 31817 }, { "epoch": 0.96, "learning_rate": 2.2528875378818038e-08, "loss": 1.2379, "step": 31818 }, { "epoch": 0.96, "learning_rate": 2.249621472723701e-08, "loss": 1.1469, "step": 31819 }, { "epoch": 0.96, "learning_rate": 2.2463577660299107e-08, "loss": 1.114, "step": 31820 }, { "epoch": 0.96, "learning_rate": 2.2430964178314364e-08, "loss": 1.0223, "step": 31821 }, { "epoch": 0.96, "learning_rate": 2.2398374281593916e-08, "loss": 1.0864, "step": 31822 }, { "epoch": 0.96, "learning_rate": 2.2365807970447518e-08, "loss": 0.9598, "step": 31823 }, { "epoch": 0.96, "learning_rate": 2.2333265245185476e-08, "loss": 1.2079, "step": 31824 }, { "epoch": 0.96, "learning_rate": 2.2300746106117264e-08, "loss": 1.0983, "step": 31825 }, { "epoch": 0.96, "learning_rate": 2.2268250553552917e-08, "loss": 1.1781, "step": 31826 }, { "epoch": 0.96, "learning_rate": 2.223577858780135e-08, "loss": 1.1637, "step": 31827 }, { "epoch": 0.96, "learning_rate": 2.220333020917176e-08, "loss": 1.0553, "step": 31828 }, { "epoch": 0.96, "learning_rate": 2.2170905417973066e-08, "loss": 1.0928, "step": 31829 }, { "epoch": 0.96, "learning_rate": 2.213850421451419e-08, "loss": 1.0936, "step": 31830 }, { "epoch": 0.96, "learning_rate": 2.2106126599103495e-08, "loss": 1.2167, "step": 31831 }, { "epoch": 0.96, "learning_rate": 2.207377257204879e-08, "loss": 1.041, "step": 31832 }, { "epoch": 0.96, "learning_rate": 2.204144213365844e-08, "loss": 1.0895, "step": 31833 }, { "epoch": 0.96, "learning_rate": 2.2009135284240258e-08, "loss": 1.0339, "step": 31834 }, { "epoch": 0.96, "learning_rate": 2.197685202410149e-08, "loss": 1.1979, "step": 31835 }, { "epoch": 0.96, "learning_rate": 2.1944592353549677e-08, "loss": 1.1772, "step": 31836 }, { "epoch": 0.96, "learning_rate": 2.1912356272892064e-08, "loss": 1.1994, "step": 31837 }, { "epoch": 0.96, "learning_rate": 2.1880143782435082e-08, "loss": 1.0767, "step": 31838 }, { "epoch": 0.96, "learning_rate": 2.18479548824857e-08, "loss": 1.0537, "step": 31839 }, { "epoch": 0.96, "learning_rate": 2.1815789573350342e-08, "loss": 1.014, "step": 31840 }, { "epoch": 0.96, "learning_rate": 2.1783647855334878e-08, "loss": 1.0934, "step": 31841 }, { "epoch": 0.96, "learning_rate": 2.1751529728745723e-08, "loss": 1.0753, "step": 31842 }, { "epoch": 0.96, "learning_rate": 2.1719435193888473e-08, "loss": 1.0972, "step": 31843 }, { "epoch": 0.96, "learning_rate": 2.168736425106871e-08, "loss": 1.1929, "step": 31844 }, { "epoch": 0.96, "learning_rate": 2.165531690059147e-08, "loss": 1.0897, "step": 31845 }, { "epoch": 0.96, "learning_rate": 2.1623293142762068e-08, "loss": 1.0452, "step": 31846 }, { "epoch": 0.96, "learning_rate": 2.159129297788526e-08, "loss": 1.0808, "step": 31847 }, { "epoch": 0.96, "learning_rate": 2.1559316406265797e-08, "loss": 1.1884, "step": 31848 }, { "epoch": 0.96, "learning_rate": 2.1527363428207883e-08, "loss": 1.1063, "step": 31849 }, { "epoch": 0.96, "learning_rate": 2.1495434044015717e-08, "loss": 1.1074, "step": 31850 }, { "epoch": 0.96, "learning_rate": 2.1463528253993504e-08, "loss": 1.0664, "step": 31851 }, { "epoch": 0.96, "learning_rate": 2.143164605844489e-08, "loss": 1.0296, "step": 31852 }, { "epoch": 0.96, "learning_rate": 2.1399787457673237e-08, "loss": 1.0817, "step": 31853 }, { "epoch": 0.96, "learning_rate": 2.1367952451981646e-08, "loss": 1.1354, "step": 31854 }, { "epoch": 0.96, "learning_rate": 2.1336141041673474e-08, "loss": 1.0511, "step": 31855 }, { "epoch": 0.96, "learning_rate": 2.1304353227051542e-08, "loss": 1.1094, "step": 31856 }, { "epoch": 0.96, "learning_rate": 2.127258900841839e-08, "loss": 1.071, "step": 31857 }, { "epoch": 0.96, "learning_rate": 2.1240848386076263e-08, "loss": 1.0695, "step": 31858 }, { "epoch": 0.96, "learning_rate": 2.1209131360327707e-08, "loss": 1.0689, "step": 31859 }, { "epoch": 0.96, "learning_rate": 2.1177437931474143e-08, "loss": 1.0538, "step": 31860 }, { "epoch": 0.96, "learning_rate": 2.1145768099817832e-08, "loss": 1.0847, "step": 31861 }, { "epoch": 0.96, "learning_rate": 2.1114121865659644e-08, "loss": 1.1577, "step": 31862 }, { "epoch": 0.96, "learning_rate": 2.108249922930128e-08, "loss": 1.0826, "step": 31863 }, { "epoch": 0.96, "learning_rate": 2.1050900191043334e-08, "loss": 1.0432, "step": 31864 }, { "epoch": 0.96, "learning_rate": 2.101932475118723e-08, "loss": 1.0876, "step": 31865 }, { "epoch": 0.96, "learning_rate": 2.098777291003329e-08, "loss": 1.018, "step": 31866 }, { "epoch": 0.96, "learning_rate": 2.0956244667881542e-08, "loss": 1.0882, "step": 31867 }, { "epoch": 0.96, "learning_rate": 2.0924740025032587e-08, "loss": 1.1143, "step": 31868 }, { "epoch": 0.96, "learning_rate": 2.0893258981786178e-08, "loss": 1.1682, "step": 31869 }, { "epoch": 0.96, "learning_rate": 2.0861801538441806e-08, "loss": 1.0965, "step": 31870 }, { "epoch": 0.96, "learning_rate": 2.0830367695299224e-08, "loss": 1.0775, "step": 31871 }, { "epoch": 0.96, "learning_rate": 2.0798957452657642e-08, "loss": 1.1887, "step": 31872 }, { "epoch": 0.96, "learning_rate": 2.0767570810815707e-08, "loss": 1.1491, "step": 31873 }, { "epoch": 0.96, "learning_rate": 2.0736207770072627e-08, "loss": 1.231, "step": 31874 }, { "epoch": 0.96, "learning_rate": 2.0704868330726767e-08, "loss": 1.0624, "step": 31875 }, { "epoch": 0.96, "learning_rate": 2.067355249307651e-08, "loss": 1.0099, "step": 31876 }, { "epoch": 0.96, "learning_rate": 2.0642260257419666e-08, "loss": 1.1058, "step": 31877 }, { "epoch": 0.96, "learning_rate": 2.0610991624054888e-08, "loss": 1.0771, "step": 31878 }, { "epoch": 0.96, "learning_rate": 2.057974659327916e-08, "loss": 1.1519, "step": 31879 }, { "epoch": 0.96, "learning_rate": 2.054852516539002e-08, "loss": 1.0767, "step": 31880 }, { "epoch": 0.96, "learning_rate": 2.0517327340684734e-08, "loss": 1.1049, "step": 31881 }, { "epoch": 0.96, "learning_rate": 2.0486153119460284e-08, "loss": 1.1035, "step": 31882 }, { "epoch": 0.96, "learning_rate": 2.0455002502013933e-08, "loss": 1.0848, "step": 31883 }, { "epoch": 0.96, "learning_rate": 2.0423875488641275e-08, "loss": 1.0679, "step": 31884 }, { "epoch": 0.96, "learning_rate": 2.03927720796393e-08, "loss": 1.0948, "step": 31885 }, { "epoch": 0.96, "learning_rate": 2.0361692275303878e-08, "loss": 1.2048, "step": 31886 }, { "epoch": 0.96, "learning_rate": 2.0330636075931165e-08, "loss": 1.0214, "step": 31887 }, { "epoch": 0.96, "learning_rate": 2.02996034818162e-08, "loss": 1.0322, "step": 31888 }, { "epoch": 0.96, "learning_rate": 2.0268594493254857e-08, "loss": 1.0514, "step": 31889 }, { "epoch": 0.96, "learning_rate": 2.0237609110542177e-08, "loss": 1.1187, "step": 31890 }, { "epoch": 0.96, "learning_rate": 2.0206647333973206e-08, "loss": 1.079, "step": 31891 }, { "epoch": 0.96, "learning_rate": 2.0175709163842706e-08, "loss": 1.132, "step": 31892 }, { "epoch": 0.96, "learning_rate": 2.0144794600445162e-08, "loss": 1.1084, "step": 31893 }, { "epoch": 0.96, "learning_rate": 2.0113903644074505e-08, "loss": 1.0158, "step": 31894 }, { "epoch": 0.96, "learning_rate": 2.0083036295025503e-08, "loss": 1.1478, "step": 31895 }, { "epoch": 0.96, "learning_rate": 2.0052192553591533e-08, "loss": 1.038, "step": 31896 }, { "epoch": 0.96, "learning_rate": 2.0021372420066244e-08, "loss": 1.0844, "step": 31897 }, { "epoch": 0.96, "learning_rate": 1.9990575894743015e-08, "loss": 1.136, "step": 31898 }, { "epoch": 0.96, "learning_rate": 1.9959802977915222e-08, "loss": 1.332, "step": 31899 }, { "epoch": 0.96, "learning_rate": 1.9929053669875685e-08, "loss": 0.9763, "step": 31900 }, { "epoch": 0.96, "learning_rate": 1.9898327970916954e-08, "loss": 1.1094, "step": 31901 }, { "epoch": 0.96, "learning_rate": 1.9867625881331842e-08, "loss": 1.058, "step": 31902 }, { "epoch": 0.96, "learning_rate": 1.9836947401412342e-08, "loss": 1.0496, "step": 31903 }, { "epoch": 0.96, "learning_rate": 1.980629253145072e-08, "loss": 0.9893, "step": 31904 }, { "epoch": 0.96, "learning_rate": 1.977566127173869e-08, "loss": 1.0909, "step": 31905 }, { "epoch": 0.96, "learning_rate": 1.9745053622567955e-08, "loss": 1.0336, "step": 31906 }, { "epoch": 0.96, "learning_rate": 1.9714469584229402e-08, "loss": 1.08, "step": 31907 }, { "epoch": 0.96, "learning_rate": 1.9683909157015014e-08, "loss": 1.1104, "step": 31908 }, { "epoch": 0.96, "learning_rate": 1.9653372341215116e-08, "loss": 1.0386, "step": 31909 }, { "epoch": 0.96, "learning_rate": 1.962285913712031e-08, "loss": 1.0847, "step": 31910 }, { "epoch": 0.96, "learning_rate": 1.9592369545021473e-08, "loss": 1.0859, "step": 31911 }, { "epoch": 0.96, "learning_rate": 1.956190356520865e-08, "loss": 1.1769, "step": 31912 }, { "epoch": 0.96, "learning_rate": 1.953146119797189e-08, "loss": 1.0599, "step": 31913 }, { "epoch": 0.96, "learning_rate": 1.950104244360096e-08, "loss": 1.054, "step": 31914 }, { "epoch": 0.96, "learning_rate": 1.947064730238535e-08, "loss": 1.044, "step": 31915 }, { "epoch": 0.96, "learning_rate": 1.9440275774614548e-08, "loss": 1.1354, "step": 31916 }, { "epoch": 0.96, "learning_rate": 1.940992786057805e-08, "loss": 1.108, "step": 31917 }, { "epoch": 0.96, "learning_rate": 1.9379603560563954e-08, "loss": 1.2739, "step": 31918 }, { "epoch": 0.96, "learning_rate": 1.93493028748612e-08, "loss": 1.0206, "step": 31919 }, { "epoch": 0.96, "learning_rate": 1.9319025803758716e-08, "loss": 1.2145, "step": 31920 }, { "epoch": 0.96, "learning_rate": 1.928877234754406e-08, "loss": 1.0945, "step": 31921 }, { "epoch": 0.96, "learning_rate": 1.9258542506505605e-08, "loss": 1.1652, "step": 31922 }, { "epoch": 0.96, "learning_rate": 1.9228336280931182e-08, "loss": 1.1274, "step": 31923 }, { "epoch": 0.96, "learning_rate": 1.9198153671108056e-08, "loss": 1.255, "step": 31924 }, { "epoch": 0.96, "learning_rate": 1.9167994677323777e-08, "loss": 1.1488, "step": 31925 }, { "epoch": 0.96, "learning_rate": 1.9137859299865612e-08, "loss": 1.0657, "step": 31926 }, { "epoch": 0.96, "learning_rate": 1.9107747539020004e-08, "loss": 1.0454, "step": 31927 }, { "epoch": 0.96, "learning_rate": 1.9077659395073667e-08, "loss": 1.0453, "step": 31928 }, { "epoch": 0.96, "learning_rate": 1.9047594868313313e-08, "loss": 1.2059, "step": 31929 }, { "epoch": 0.96, "learning_rate": 1.9017553959025104e-08, "loss": 1.0659, "step": 31930 }, { "epoch": 0.96, "learning_rate": 1.8987536667494645e-08, "loss": 1.0958, "step": 31931 }, { "epoch": 0.96, "learning_rate": 1.8957542994008092e-08, "loss": 1.0786, "step": 31932 }, { "epoch": 0.96, "learning_rate": 1.892757293885078e-08, "loss": 1.077, "step": 31933 }, { "epoch": 0.96, "learning_rate": 1.8897626502308032e-08, "loss": 1.0532, "step": 31934 }, { "epoch": 0.96, "learning_rate": 1.8867703684665174e-08, "loss": 1.1161, "step": 31935 }, { "epoch": 0.96, "learning_rate": 1.8837804486206702e-08, "loss": 1.0974, "step": 31936 }, { "epoch": 0.96, "learning_rate": 1.880792890721711e-08, "loss": 1.243, "step": 31937 }, { "epoch": 0.96, "learning_rate": 1.877807694798117e-08, "loss": 1.1342, "step": 31938 }, { "epoch": 0.96, "learning_rate": 1.8748248608783103e-08, "loss": 1.2192, "step": 31939 }, { "epoch": 0.96, "learning_rate": 1.8718443889906567e-08, "loss": 1.0419, "step": 31940 }, { "epoch": 0.96, "learning_rate": 1.8688662791635504e-08, "loss": 0.9777, "step": 31941 }, { "epoch": 0.96, "learning_rate": 1.8658905314253294e-08, "loss": 1.1228, "step": 31942 }, { "epoch": 0.96, "learning_rate": 1.8629171458043326e-08, "loss": 1.1687, "step": 31943 }, { "epoch": 0.96, "learning_rate": 1.8599461223288428e-08, "loss": 1.144, "step": 31944 }, { "epoch": 0.96, "learning_rate": 1.856977461027143e-08, "loss": 1.0472, "step": 31945 }, { "epoch": 0.96, "learning_rate": 1.8540111619275438e-08, "loss": 1.1274, "step": 31946 }, { "epoch": 0.96, "learning_rate": 1.8510472250582167e-08, "loss": 1.1154, "step": 31947 }, { "epoch": 0.96, "learning_rate": 1.8480856504474178e-08, "loss": 1.1072, "step": 31948 }, { "epoch": 0.96, "learning_rate": 1.845126438123318e-08, "loss": 1.1812, "step": 31949 }, { "epoch": 0.96, "learning_rate": 1.8421695881141455e-08, "loss": 1.1703, "step": 31950 }, { "epoch": 0.96, "learning_rate": 1.839215100447961e-08, "loss": 1.0826, "step": 31951 }, { "epoch": 0.96, "learning_rate": 1.8362629751529358e-08, "loss": 0.9662, "step": 31952 }, { "epoch": 0.96, "learning_rate": 1.8333132122571595e-08, "loss": 0.9956, "step": 31953 }, { "epoch": 0.96, "learning_rate": 1.8303658117887478e-08, "loss": 1.1172, "step": 31954 }, { "epoch": 0.96, "learning_rate": 1.8274207737757066e-08, "loss": 1.1382, "step": 31955 }, { "epoch": 0.96, "learning_rate": 1.8244780982460964e-08, "loss": 1.2294, "step": 31956 }, { "epoch": 0.96, "learning_rate": 1.8215377852279505e-08, "loss": 0.9738, "step": 31957 }, { "epoch": 0.96, "learning_rate": 1.8185998347492184e-08, "loss": 1.0576, "step": 31958 }, { "epoch": 0.96, "learning_rate": 1.8156642468378783e-08, "loss": 1.0543, "step": 31959 }, { "epoch": 0.96, "learning_rate": 1.8127310215219075e-08, "loss": 1.0685, "step": 31960 }, { "epoch": 0.96, "learning_rate": 1.8098001588292e-08, "loss": 1.0787, "step": 31961 }, { "epoch": 0.96, "learning_rate": 1.8068716587876788e-08, "loss": 1.0883, "step": 31962 }, { "epoch": 0.96, "learning_rate": 1.8039455214251822e-08, "loss": 1.0016, "step": 31963 }, { "epoch": 0.96, "learning_rate": 1.8010217467695767e-08, "loss": 1.1055, "step": 31964 }, { "epoch": 0.96, "learning_rate": 1.798100334848757e-08, "loss": 1.0422, "step": 31965 }, { "epoch": 0.96, "learning_rate": 1.7951812856904505e-08, "loss": 1.1104, "step": 31966 }, { "epoch": 0.96, "learning_rate": 1.7922645993224687e-08, "loss": 1.0872, "step": 31967 }, { "epoch": 0.96, "learning_rate": 1.7893502757725944e-08, "loss": 1.1361, "step": 31968 }, { "epoch": 0.96, "learning_rate": 1.7864383150685838e-08, "loss": 1.1047, "step": 31969 }, { "epoch": 0.96, "learning_rate": 1.7835287172381087e-08, "loss": 1.1389, "step": 31970 }, { "epoch": 0.96, "learning_rate": 1.7806214823088973e-08, "loss": 1.172, "step": 31971 }, { "epoch": 0.96, "learning_rate": 1.7777166103086495e-08, "loss": 1.1572, "step": 31972 }, { "epoch": 0.96, "learning_rate": 1.7748141012649544e-08, "loss": 1.1295, "step": 31973 }, { "epoch": 0.96, "learning_rate": 1.771913955205512e-08, "loss": 1.2395, "step": 31974 }, { "epoch": 0.96, "learning_rate": 1.7690161721578835e-08, "loss": 1.119, "step": 31975 }, { "epoch": 0.96, "learning_rate": 1.766120752149686e-08, "loss": 1.1139, "step": 31976 }, { "epoch": 0.96, "learning_rate": 1.7632276952084247e-08, "loss": 1.042, "step": 31977 }, { "epoch": 0.96, "learning_rate": 1.760337001361717e-08, "loss": 1.0476, "step": 31978 }, { "epoch": 0.96, "learning_rate": 1.757448670637041e-08, "loss": 1.0922, "step": 31979 }, { "epoch": 0.96, "learning_rate": 1.754562703061874e-08, "loss": 1.1752, "step": 31980 }, { "epoch": 0.96, "learning_rate": 1.751679098663722e-08, "loss": 1.2185, "step": 31981 }, { "epoch": 0.96, "learning_rate": 1.748797857470036e-08, "loss": 1.0767, "step": 31982 }, { "epoch": 0.96, "learning_rate": 1.7459189795082377e-08, "loss": 1.0856, "step": 31983 }, { "epoch": 0.96, "learning_rate": 1.743042464805694e-08, "loss": 1.0602, "step": 31984 }, { "epoch": 0.96, "learning_rate": 1.7401683133898562e-08, "loss": 1.0485, "step": 31985 }, { "epoch": 0.96, "learning_rate": 1.7372965252880348e-08, "loss": 1.0984, "step": 31986 }, { "epoch": 0.96, "learning_rate": 1.734427100527597e-08, "loss": 1.0944, "step": 31987 }, { "epoch": 0.96, "learning_rate": 1.7315600391358268e-08, "loss": 1.1652, "step": 31988 }, { "epoch": 0.96, "learning_rate": 1.7286953411400355e-08, "loss": 1.0342, "step": 31989 }, { "epoch": 0.96, "learning_rate": 1.725833006567479e-08, "loss": 1.0493, "step": 31990 }, { "epoch": 0.96, "learning_rate": 1.7229730354454687e-08, "loss": 0.9794, "step": 31991 }, { "epoch": 0.96, "learning_rate": 1.7201154278011502e-08, "loss": 1.0703, "step": 31992 }, { "epoch": 0.96, "learning_rate": 1.717260183661751e-08, "loss": 1.0901, "step": 31993 }, { "epoch": 0.96, "learning_rate": 1.714407303054444e-08, "loss": 1.1056, "step": 31994 }, { "epoch": 0.96, "learning_rate": 1.7115567860064298e-08, "loss": 1.1573, "step": 31995 }, { "epoch": 0.96, "learning_rate": 1.7087086325447975e-08, "loss": 1.0023, "step": 31996 }, { "epoch": 0.96, "learning_rate": 1.7058628426966926e-08, "loss": 1.0665, "step": 31997 }, { "epoch": 0.96, "learning_rate": 1.7030194164891768e-08, "loss": 1.0176, "step": 31998 }, { "epoch": 0.96, "learning_rate": 1.700178353949339e-08, "loss": 1.1334, "step": 31999 }, { "epoch": 0.96, "learning_rate": 1.697339655104241e-08, "loss": 1.0538, "step": 32000 }, { "epoch": 0.96, "learning_rate": 1.6945033199808615e-08, "loss": 1.1263, "step": 32001 }, { "epoch": 0.96, "learning_rate": 1.6916693486062065e-08, "loss": 1.0593, "step": 32002 }, { "epoch": 0.96, "learning_rate": 1.688837741007282e-08, "loss": 1.1087, "step": 32003 }, { "epoch": 0.96, "learning_rate": 1.6860084972110392e-08, "loss": 0.963, "step": 32004 }, { "epoch": 0.96, "learning_rate": 1.6831816172444006e-08, "loss": 1.1, "step": 32005 }, { "epoch": 0.96, "learning_rate": 1.6803571011342613e-08, "loss": 1.0673, "step": 32006 }, { "epoch": 0.96, "learning_rate": 1.6775349489075442e-08, "loss": 1.1176, "step": 32007 }, { "epoch": 0.96, "learning_rate": 1.674715160591117e-08, "loss": 1.1547, "step": 32008 }, { "epoch": 0.96, "learning_rate": 1.6718977362117916e-08, "loss": 1.1432, "step": 32009 }, { "epoch": 0.96, "learning_rate": 1.6690826757963798e-08, "loss": 1.1175, "step": 32010 }, { "epoch": 0.96, "learning_rate": 1.6662699793717208e-08, "loss": 1.1069, "step": 32011 }, { "epoch": 0.96, "learning_rate": 1.6634596469645713e-08, "loss": 1.1921, "step": 32012 }, { "epoch": 0.96, "learning_rate": 1.6606516786016604e-08, "loss": 1.1487, "step": 32013 }, { "epoch": 0.96, "learning_rate": 1.6578460743097712e-08, "loss": 1.0002, "step": 32014 }, { "epoch": 0.96, "learning_rate": 1.65504283411555e-08, "loss": 1.0417, "step": 32015 }, { "epoch": 0.96, "learning_rate": 1.6522419580457248e-08, "loss": 1.1084, "step": 32016 }, { "epoch": 0.96, "learning_rate": 1.6494434461269693e-08, "loss": 1.1546, "step": 32017 }, { "epoch": 0.96, "learning_rate": 1.6466472983858727e-08, "loss": 1.2616, "step": 32018 }, { "epoch": 0.96, "learning_rate": 1.6438535148491086e-08, "loss": 1.1478, "step": 32019 }, { "epoch": 0.96, "learning_rate": 1.6410620955432388e-08, "loss": 1.0852, "step": 32020 }, { "epoch": 0.96, "learning_rate": 1.6382730404948534e-08, "loss": 1.082, "step": 32021 }, { "epoch": 0.96, "learning_rate": 1.6354863497304583e-08, "loss": 1.0094, "step": 32022 }, { "epoch": 0.96, "learning_rate": 1.6327020232766445e-08, "loss": 1.071, "step": 32023 }, { "epoch": 0.96, "learning_rate": 1.62992006115989e-08, "loss": 1.186, "step": 32024 }, { "epoch": 0.96, "learning_rate": 1.6271404634066733e-08, "loss": 1.0869, "step": 32025 }, { "epoch": 0.96, "learning_rate": 1.6243632300434465e-08, "loss": 1.1717, "step": 32026 }, { "epoch": 0.96, "learning_rate": 1.6215883610966877e-08, "loss": 1.0798, "step": 32027 }, { "epoch": 0.96, "learning_rate": 1.6188158565927646e-08, "loss": 1.0447, "step": 32028 }, { "epoch": 0.96, "learning_rate": 1.6160457165580734e-08, "loss": 1.1249, "step": 32029 }, { "epoch": 0.96, "learning_rate": 1.6132779410190368e-08, "loss": 1.1124, "step": 32030 }, { "epoch": 0.96, "learning_rate": 1.61051253000194e-08, "loss": 1.1762, "step": 32031 }, { "epoch": 0.96, "learning_rate": 1.60774948353315e-08, "loss": 1.0841, "step": 32032 }, { "epoch": 0.96, "learning_rate": 1.6049888016389514e-08, "loss": 1.1623, "step": 32033 }, { "epoch": 0.97, "learning_rate": 1.6022304843456295e-08, "loss": 1.1883, "step": 32034 }, { "epoch": 0.97, "learning_rate": 1.5994745316794402e-08, "loss": 1.1302, "step": 32035 }, { "epoch": 0.97, "learning_rate": 1.596720943666613e-08, "loss": 1.087, "step": 32036 }, { "epoch": 0.97, "learning_rate": 1.593969720333377e-08, "loss": 1.1425, "step": 32037 }, { "epoch": 0.97, "learning_rate": 1.5912208617059056e-08, "loss": 1.0977, "step": 32038 }, { "epoch": 0.97, "learning_rate": 1.588474367810372e-08, "loss": 1.0911, "step": 32039 }, { "epoch": 0.97, "learning_rate": 1.5857302386729222e-08, "loss": 1.0915, "step": 32040 }, { "epoch": 0.97, "learning_rate": 1.582988474319702e-08, "loss": 1.0597, "step": 32041 }, { "epoch": 0.97, "learning_rate": 1.580249074776774e-08, "loss": 1.1179, "step": 32042 }, { "epoch": 0.97, "learning_rate": 1.5775120400702282e-08, "loss": 1.1022, "step": 32043 }, { "epoch": 0.97, "learning_rate": 1.5747773702261272e-08, "loss": 1.0228, "step": 32044 }, { "epoch": 0.97, "learning_rate": 1.5720450652705056e-08, "loss": 1.1074, "step": 32045 }, { "epoch": 0.97, "learning_rate": 1.5693151252293702e-08, "loss": 1.0544, "step": 32046 }, { "epoch": 0.97, "learning_rate": 1.5665875501287008e-08, "loss": 1.0933, "step": 32047 }, { "epoch": 0.97, "learning_rate": 1.5638623399944487e-08, "loss": 1.0942, "step": 32048 }, { "epoch": 0.97, "learning_rate": 1.5611394948525927e-08, "loss": 1.1691, "step": 32049 }, { "epoch": 0.97, "learning_rate": 1.558419014729057e-08, "loss": 1.0988, "step": 32050 }, { "epoch": 0.97, "learning_rate": 1.5557008996496815e-08, "loss": 1.2502, "step": 32051 }, { "epoch": 0.97, "learning_rate": 1.552985149640418e-08, "loss": 1.1017, "step": 32052 }, { "epoch": 0.97, "learning_rate": 1.5502717647270516e-08, "loss": 1.05, "step": 32053 }, { "epoch": 0.97, "learning_rate": 1.5475607449354502e-08, "loss": 1.1097, "step": 32054 }, { "epoch": 0.97, "learning_rate": 1.5448520902913988e-08, "loss": 1.0856, "step": 32055 }, { "epoch": 0.97, "learning_rate": 1.54214580082071e-08, "loss": 1.1403, "step": 32056 }, { "epoch": 0.97, "learning_rate": 1.5394418765491136e-08, "loss": 1.1152, "step": 32057 }, { "epoch": 0.97, "learning_rate": 1.5367403175023944e-08, "loss": 1.0318, "step": 32058 }, { "epoch": 0.97, "learning_rate": 1.5340411237062257e-08, "loss": 1.0532, "step": 32059 }, { "epoch": 0.97, "learning_rate": 1.53134429518631e-08, "loss": 1.0895, "step": 32060 }, { "epoch": 0.97, "learning_rate": 1.5286498319683484e-08, "loss": 1.0398, "step": 32061 }, { "epoch": 0.97, "learning_rate": 1.5259577340779595e-08, "loss": 1.085, "step": 32062 }, { "epoch": 0.97, "learning_rate": 1.5232680015407895e-08, "loss": 1.1439, "step": 32063 }, { "epoch": 0.97, "learning_rate": 1.5205806343824568e-08, "loss": 1.1082, "step": 32064 }, { "epoch": 0.97, "learning_rate": 1.5178956326284965e-08, "loss": 1.094, "step": 32065 }, { "epoch": 0.97, "learning_rate": 1.515212996304527e-08, "loss": 1.1232, "step": 32066 }, { "epoch": 0.97, "learning_rate": 1.5125327254360278e-08, "loss": 1.0065, "step": 32067 }, { "epoch": 0.97, "learning_rate": 1.509854820048534e-08, "loss": 1.1743, "step": 32068 }, { "epoch": 0.97, "learning_rate": 1.507179280167581e-08, "loss": 1.1157, "step": 32069 }, { "epoch": 0.97, "learning_rate": 1.504506105818593e-08, "loss": 1.1152, "step": 32070 }, { "epoch": 0.97, "learning_rate": 1.501835297027021e-08, "loss": 1.0011, "step": 32071 }, { "epoch": 0.97, "learning_rate": 1.4991668538182903e-08, "loss": 1.0643, "step": 32072 }, { "epoch": 0.97, "learning_rate": 1.496500776217824e-08, "loss": 1.0869, "step": 32073 }, { "epoch": 0.97, "learning_rate": 1.4938370642509636e-08, "loss": 1.1469, "step": 32074 }, { "epoch": 0.97, "learning_rate": 1.4911757179431052e-08, "loss": 1.0876, "step": 32075 }, { "epoch": 0.97, "learning_rate": 1.4885167373195619e-08, "loss": 1.0998, "step": 32076 }, { "epoch": 0.97, "learning_rate": 1.4858601224056468e-08, "loss": 1.0242, "step": 32077 }, { "epoch": 0.97, "learning_rate": 1.483205873226673e-08, "loss": 1.0602, "step": 32078 }, { "epoch": 0.97, "learning_rate": 1.4805539898078702e-08, "loss": 1.0782, "step": 32079 }, { "epoch": 0.97, "learning_rate": 1.4779044721745239e-08, "loss": 1.1487, "step": 32080 }, { "epoch": 0.97, "learning_rate": 1.4752573203518083e-08, "loss": 1.0597, "step": 32081 }, { "epoch": 0.97, "learning_rate": 1.472612534364981e-08, "loss": 1.0057, "step": 32082 }, { "epoch": 0.97, "learning_rate": 1.4699701142391608e-08, "loss": 1.0619, "step": 32083 }, { "epoch": 0.97, "learning_rate": 1.4673300599995222e-08, "loss": 1.1573, "step": 32084 }, { "epoch": 0.97, "learning_rate": 1.4646923716712391e-08, "loss": 1.0385, "step": 32085 }, { "epoch": 0.97, "learning_rate": 1.4620570492793473e-08, "loss": 1.1613, "step": 32086 }, { "epoch": 0.97, "learning_rate": 1.4594240928489934e-08, "loss": 1.1075, "step": 32087 }, { "epoch": 0.97, "learning_rate": 1.4567935024052127e-08, "loss": 1.0654, "step": 32088 }, { "epoch": 0.97, "learning_rate": 1.4541652779730686e-08, "loss": 1.0614, "step": 32089 }, { "epoch": 0.97, "learning_rate": 1.4515394195775689e-08, "loss": 1.0916, "step": 32090 }, { "epoch": 0.97, "learning_rate": 1.4489159272436937e-08, "loss": 1.0786, "step": 32091 }, { "epoch": 0.97, "learning_rate": 1.4462948009964228e-08, "loss": 1.1717, "step": 32092 }, { "epoch": 0.97, "learning_rate": 1.4436760408607364e-08, "loss": 1.1342, "step": 32093 }, { "epoch": 0.97, "learning_rate": 1.441059646861559e-08, "loss": 1.0706, "step": 32094 }, { "epoch": 0.97, "learning_rate": 1.4384456190237594e-08, "loss": 1.0945, "step": 32095 }, { "epoch": 0.97, "learning_rate": 1.4358339573722624e-08, "loss": 1.097, "step": 32096 }, { "epoch": 0.97, "learning_rate": 1.433224661931909e-08, "loss": 1.0603, "step": 32097 }, { "epoch": 0.97, "learning_rate": 1.4306177327275129e-08, "loss": 1.2162, "step": 32098 }, { "epoch": 0.97, "learning_rate": 1.4280131697839705e-08, "loss": 1.1497, "step": 32099 }, { "epoch": 0.97, "learning_rate": 1.4254109731260123e-08, "loss": 1.1578, "step": 32100 }, { "epoch": 0.97, "learning_rate": 1.4228111427783964e-08, "loss": 1.1984, "step": 32101 }, { "epoch": 0.97, "learning_rate": 1.4202136787659082e-08, "loss": 1.1683, "step": 32102 }, { "epoch": 0.97, "learning_rate": 1.4176185811133059e-08, "loss": 1.0125, "step": 32103 }, { "epoch": 0.97, "learning_rate": 1.4150258498452086e-08, "loss": 1.0954, "step": 32104 }, { "epoch": 0.97, "learning_rate": 1.4124354849863465e-08, "loss": 1.1069, "step": 32105 }, { "epoch": 0.97, "learning_rate": 1.4098474865613942e-08, "loss": 1.1575, "step": 32106 }, { "epoch": 0.97, "learning_rate": 1.4072618545949435e-08, "loss": 0.9961, "step": 32107 }, { "epoch": 0.97, "learning_rate": 1.4046785891116687e-08, "loss": 1.1757, "step": 32108 }, { "epoch": 0.97, "learning_rate": 1.402097690136106e-08, "loss": 1.0636, "step": 32109 }, { "epoch": 0.97, "learning_rate": 1.3995191576928469e-08, "loss": 1.1542, "step": 32110 }, { "epoch": 0.97, "learning_rate": 1.396942991806427e-08, "loss": 1.1235, "step": 32111 }, { "epoch": 0.97, "learning_rate": 1.3943691925013824e-08, "loss": 1.1348, "step": 32112 }, { "epoch": 0.97, "learning_rate": 1.3917977598022215e-08, "loss": 1.0857, "step": 32113 }, { "epoch": 0.97, "learning_rate": 1.3892286937333965e-08, "loss": 1.0928, "step": 32114 }, { "epoch": 0.97, "learning_rate": 1.3866619943193882e-08, "loss": 1.0354, "step": 32115 }, { "epoch": 0.97, "learning_rate": 1.3840976615846213e-08, "loss": 0.9737, "step": 32116 }, { "epoch": 0.97, "learning_rate": 1.381535695553493e-08, "loss": 1.0978, "step": 32117 }, { "epoch": 0.97, "learning_rate": 1.3789760962504285e-08, "loss": 1.149, "step": 32118 }, { "epoch": 0.97, "learning_rate": 1.3764188636997688e-08, "loss": 1.0585, "step": 32119 }, { "epoch": 0.97, "learning_rate": 1.3738639979258561e-08, "loss": 1.0618, "step": 32120 }, { "epoch": 0.97, "learning_rate": 1.3713114989530041e-08, "loss": 1.1432, "step": 32121 }, { "epoch": 0.97, "learning_rate": 1.3687613668055267e-08, "loss": 1.1068, "step": 32122 }, { "epoch": 0.97, "learning_rate": 1.36621360150771e-08, "loss": 1.1393, "step": 32123 }, { "epoch": 0.97, "learning_rate": 1.3636682030837845e-08, "loss": 1.1648, "step": 32124 }, { "epoch": 0.97, "learning_rate": 1.3611251715580087e-08, "loss": 1.1105, "step": 32125 }, { "epoch": 0.97, "learning_rate": 1.35858450695453e-08, "loss": 1.0532, "step": 32126 }, { "epoch": 0.97, "learning_rate": 1.3560462092976067e-08, "loss": 1.0686, "step": 32127 }, { "epoch": 0.97, "learning_rate": 1.3535102786113584e-08, "loss": 1.0583, "step": 32128 }, { "epoch": 0.97, "learning_rate": 1.3509767149199604e-08, "loss": 1.0688, "step": 32129 }, { "epoch": 0.97, "learning_rate": 1.3484455182475042e-08, "loss": 1.0768, "step": 32130 }, { "epoch": 0.97, "learning_rate": 1.3459166886180818e-08, "loss": 1.1377, "step": 32131 }, { "epoch": 0.97, "learning_rate": 1.3433902260557851e-08, "loss": 1.0825, "step": 32132 }, { "epoch": 0.97, "learning_rate": 1.3408661305846505e-08, "loss": 1.0361, "step": 32133 }, { "epoch": 0.97, "learning_rate": 1.338344402228714e-08, "loss": 1.1267, "step": 32134 }, { "epoch": 0.97, "learning_rate": 1.3358250410119843e-08, "loss": 1.0638, "step": 32135 }, { "epoch": 0.97, "learning_rate": 1.3333080469584425e-08, "loss": 1.1736, "step": 32136 }, { "epoch": 0.97, "learning_rate": 1.3307934200920413e-08, "loss": 1.1288, "step": 32137 }, { "epoch": 0.97, "learning_rate": 1.3282811604367064e-08, "loss": 0.9785, "step": 32138 }, { "epoch": 0.97, "learning_rate": 1.3257712680163903e-08, "loss": 1.0768, "step": 32139 }, { "epoch": 0.97, "learning_rate": 1.3232637428549633e-08, "loss": 1.0818, "step": 32140 }, { "epoch": 0.97, "learning_rate": 1.320758584976295e-08, "loss": 1.0739, "step": 32141 }, { "epoch": 0.97, "learning_rate": 1.3182557944042273e-08, "loss": 1.1628, "step": 32142 }, { "epoch": 0.97, "learning_rate": 1.3157553711626026e-08, "loss": 1.0385, "step": 32143 }, { "epoch": 0.97, "learning_rate": 1.3132573152752349e-08, "loss": 1.1075, "step": 32144 }, { "epoch": 0.97, "learning_rate": 1.3107616267658552e-08, "loss": 1.1147, "step": 32145 }, { "epoch": 0.97, "learning_rate": 1.3082683056582779e-08, "loss": 1.041, "step": 32146 }, { "epoch": 0.97, "learning_rate": 1.3057773519762062e-08, "loss": 1.073, "step": 32147 }, { "epoch": 0.97, "learning_rate": 1.3032887657433435e-08, "loss": 1.1456, "step": 32148 }, { "epoch": 0.97, "learning_rate": 1.3008025469834207e-08, "loss": 1.1215, "step": 32149 }, { "epoch": 0.97, "learning_rate": 1.2983186957200578e-08, "loss": 1.1528, "step": 32150 }, { "epoch": 0.97, "learning_rate": 1.2958372119769303e-08, "loss": 1.0829, "step": 32151 }, { "epoch": 0.97, "learning_rate": 1.2933580957776581e-08, "loss": 1.1271, "step": 32152 }, { "epoch": 0.97, "learning_rate": 1.2908813471458337e-08, "loss": 1.1101, "step": 32153 }, { "epoch": 0.97, "learning_rate": 1.2884069661050213e-08, "loss": 1.1458, "step": 32154 }, { "epoch": 0.97, "learning_rate": 1.2859349526788133e-08, "loss": 1.1805, "step": 32155 }, { "epoch": 0.97, "learning_rate": 1.283465306890691e-08, "loss": 1.1041, "step": 32156 }, { "epoch": 0.97, "learning_rate": 1.2809980287642187e-08, "loss": 1.0511, "step": 32157 }, { "epoch": 0.97, "learning_rate": 1.27853311832285e-08, "loss": 0.9832, "step": 32158 }, { "epoch": 0.97, "learning_rate": 1.276070575590066e-08, "loss": 1.0811, "step": 32159 }, { "epoch": 0.97, "learning_rate": 1.2736104005892925e-08, "loss": 1.117, "step": 32160 }, { "epoch": 0.97, "learning_rate": 1.271152593343955e-08, "loss": 1.05, "step": 32161 }, { "epoch": 0.97, "learning_rate": 1.2686971538774517e-08, "loss": 1.0887, "step": 32162 }, { "epoch": 0.97, "learning_rate": 1.2662440822131528e-08, "loss": 1.0681, "step": 32163 }, { "epoch": 0.97, "learning_rate": 1.2637933783744282e-08, "loss": 1.1265, "step": 32164 }, { "epoch": 0.97, "learning_rate": 1.261345042384593e-08, "loss": 1.1147, "step": 32165 }, { "epoch": 0.97, "learning_rate": 1.2588990742669615e-08, "loss": 1.1238, "step": 32166 }, { "epoch": 0.97, "learning_rate": 1.2564554740447932e-08, "loss": 1.0611, "step": 32167 }, { "epoch": 0.97, "learning_rate": 1.2540142417413748e-08, "loss": 1.1816, "step": 32168 }, { "epoch": 0.97, "learning_rate": 1.2515753773799655e-08, "loss": 1.0182, "step": 32169 }, { "epoch": 0.97, "learning_rate": 1.2491388809837413e-08, "loss": 1.287, "step": 32170 }, { "epoch": 0.97, "learning_rate": 1.2467047525759058e-08, "loss": 1.1039, "step": 32171 }, { "epoch": 0.97, "learning_rate": 1.2442729921796349e-08, "loss": 1.1282, "step": 32172 }, { "epoch": 0.97, "learning_rate": 1.2418435998181044e-08, "loss": 1.0436, "step": 32173 }, { "epoch": 0.97, "learning_rate": 1.2394165755143794e-08, "loss": 0.9811, "step": 32174 }, { "epoch": 0.97, "learning_rate": 1.2369919192916358e-08, "loss": 1.0122, "step": 32175 }, { "epoch": 0.97, "learning_rate": 1.2345696311729104e-08, "loss": 1.0525, "step": 32176 }, { "epoch": 0.97, "learning_rate": 1.2321497111812686e-08, "loss": 1.1224, "step": 32177 }, { "epoch": 0.97, "learning_rate": 1.2297321593397472e-08, "loss": 1.0502, "step": 32178 }, { "epoch": 0.97, "learning_rate": 1.2273169756713832e-08, "loss": 0.9763, "step": 32179 }, { "epoch": 0.97, "learning_rate": 1.2249041601991308e-08, "loss": 1.2797, "step": 32180 }, { "epoch": 0.97, "learning_rate": 1.2224937129459713e-08, "loss": 0.9897, "step": 32181 }, { "epoch": 0.97, "learning_rate": 1.2200856339348588e-08, "loss": 1.0587, "step": 32182 }, { "epoch": 0.97, "learning_rate": 1.2176799231887193e-08, "loss": 1.1329, "step": 32183 }, { "epoch": 0.97, "learning_rate": 1.2152765807304512e-08, "loss": 1.0825, "step": 32184 }, { "epoch": 0.97, "learning_rate": 1.2128756065829529e-08, "loss": 1.1367, "step": 32185 }, { "epoch": 0.97, "learning_rate": 1.2104770007690392e-08, "loss": 1.1483, "step": 32186 }, { "epoch": 0.97, "learning_rate": 1.2080807633115533e-08, "loss": 1.1967, "step": 32187 }, { "epoch": 0.97, "learning_rate": 1.20568689423331e-08, "loss": 0.9671, "step": 32188 }, { "epoch": 0.97, "learning_rate": 1.2032953935571246e-08, "loss": 1.0582, "step": 32189 }, { "epoch": 0.97, "learning_rate": 1.2009062613057288e-08, "loss": 0.9991, "step": 32190 }, { "epoch": 0.97, "learning_rate": 1.19851949750191e-08, "loss": 1.2148, "step": 32191 }, { "epoch": 0.97, "learning_rate": 1.1961351021683165e-08, "loss": 1.1936, "step": 32192 }, { "epoch": 0.97, "learning_rate": 1.1937530753277082e-08, "loss": 1.1337, "step": 32193 }, { "epoch": 0.97, "learning_rate": 1.1913734170027335e-08, "loss": 1.0468, "step": 32194 }, { "epoch": 0.97, "learning_rate": 1.1889961272160689e-08, "loss": 1.1503, "step": 32195 }, { "epoch": 0.97, "learning_rate": 1.186621205990307e-08, "loss": 1.035, "step": 32196 }, { "epoch": 0.97, "learning_rate": 1.1842486533480968e-08, "loss": 1.037, "step": 32197 }, { "epoch": 0.97, "learning_rate": 1.1818784693120033e-08, "loss": 1.1866, "step": 32198 }, { "epoch": 0.97, "learning_rate": 1.179510653904592e-08, "loss": 1.1359, "step": 32199 }, { "epoch": 0.97, "learning_rate": 1.1771452071484002e-08, "loss": 0.9769, "step": 32200 }, { "epoch": 0.97, "learning_rate": 1.1747821290659379e-08, "loss": 1.0373, "step": 32201 }, { "epoch": 0.97, "learning_rate": 1.1724214196797423e-08, "loss": 1.0988, "step": 32202 }, { "epoch": 0.97, "learning_rate": 1.1700630790122403e-08, "loss": 1.0587, "step": 32203 }, { "epoch": 0.97, "learning_rate": 1.167707107085886e-08, "loss": 1.0597, "step": 32204 }, { "epoch": 0.97, "learning_rate": 1.1653535039231334e-08, "loss": 1.1393, "step": 32205 }, { "epoch": 0.97, "learning_rate": 1.163002269546354e-08, "loss": 1.3167, "step": 32206 }, { "epoch": 0.97, "learning_rate": 1.1606534039779737e-08, "loss": 0.9854, "step": 32207 }, { "epoch": 0.97, "learning_rate": 1.1583069072403087e-08, "loss": 0.9651, "step": 32208 }, { "epoch": 0.97, "learning_rate": 1.1559627793557293e-08, "loss": 1.0236, "step": 32209 }, { "epoch": 0.97, "learning_rate": 1.1536210203465237e-08, "loss": 1.0598, "step": 32210 }, { "epoch": 0.97, "learning_rate": 1.1512816302350071e-08, "loss": 0.9752, "step": 32211 }, { "epoch": 0.97, "learning_rate": 1.1489446090434397e-08, "loss": 1.1187, "step": 32212 }, { "epoch": 0.97, "learning_rate": 1.1466099567940536e-08, "loss": 1.0753, "step": 32213 }, { "epoch": 0.97, "learning_rate": 1.1442776735091088e-08, "loss": 1.1328, "step": 32214 }, { "epoch": 0.97, "learning_rate": 1.1419477592107542e-08, "loss": 0.9756, "step": 32215 }, { "epoch": 0.97, "learning_rate": 1.1396202139212498e-08, "loss": 1.0298, "step": 32216 }, { "epoch": 0.97, "learning_rate": 1.137295037662689e-08, "loss": 1.0875, "step": 32217 }, { "epoch": 0.97, "learning_rate": 1.1349722304571931e-08, "loss": 1.0973, "step": 32218 }, { "epoch": 0.97, "learning_rate": 1.1326517923269386e-08, "loss": 1.1131, "step": 32219 }, { "epoch": 0.97, "learning_rate": 1.1303337232939638e-08, "loss": 1.1969, "step": 32220 }, { "epoch": 0.97, "learning_rate": 1.1280180233803618e-08, "loss": 1.1216, "step": 32221 }, { "epoch": 0.97, "learning_rate": 1.1257046926081706e-08, "loss": 1.0804, "step": 32222 }, { "epoch": 0.97, "learning_rate": 1.1233937309994003e-08, "loss": 1.0836, "step": 32223 }, { "epoch": 0.97, "learning_rate": 1.1210851385760613e-08, "loss": 1.1144, "step": 32224 }, { "epoch": 0.97, "learning_rate": 1.118778915360108e-08, "loss": 1.1361, "step": 32225 }, { "epoch": 0.97, "learning_rate": 1.116475061373523e-08, "loss": 1.1412, "step": 32226 }, { "epoch": 0.97, "learning_rate": 1.114173576638261e-08, "loss": 1.0588, "step": 32227 }, { "epoch": 0.97, "learning_rate": 1.1118744611761656e-08, "loss": 1.0907, "step": 32228 }, { "epoch": 0.97, "learning_rate": 1.1095777150091635e-08, "loss": 1.1606, "step": 32229 }, { "epoch": 0.97, "learning_rate": 1.1072833381591263e-08, "loss": 1.0048, "step": 32230 }, { "epoch": 0.97, "learning_rate": 1.1049913306478699e-08, "loss": 1.1354, "step": 32231 }, { "epoch": 0.97, "learning_rate": 1.10270169249721e-08, "loss": 1.0746, "step": 32232 }, { "epoch": 0.97, "learning_rate": 1.1004144237289904e-08, "loss": 1.0688, "step": 32233 }, { "epoch": 0.97, "learning_rate": 1.0981295243649159e-08, "loss": 1.0792, "step": 32234 }, { "epoch": 0.97, "learning_rate": 1.0958469944268023e-08, "loss": 1.1178, "step": 32235 }, { "epoch": 0.97, "learning_rate": 1.093566833936327e-08, "loss": 1.0888, "step": 32236 }, { "epoch": 0.97, "learning_rate": 1.0912890429152501e-08, "loss": 1.1741, "step": 32237 }, { "epoch": 0.97, "learning_rate": 1.0890136213851932e-08, "loss": 1.1832, "step": 32238 }, { "epoch": 0.97, "learning_rate": 1.0867405693678334e-08, "loss": 1.1032, "step": 32239 }, { "epoch": 0.97, "learning_rate": 1.084469886884848e-08, "loss": 1.0233, "step": 32240 }, { "epoch": 0.97, "learning_rate": 1.0822015739578307e-08, "loss": 1.1513, "step": 32241 }, { "epoch": 0.97, "learning_rate": 1.0799356306083752e-08, "loss": 1.1025, "step": 32242 }, { "epoch": 0.97, "learning_rate": 1.0776720568580201e-08, "loss": 1.0541, "step": 32243 }, { "epoch": 0.97, "learning_rate": 1.0754108527283591e-08, "loss": 1.0687, "step": 32244 }, { "epoch": 0.97, "learning_rate": 1.0731520182409027e-08, "loss": 1.1423, "step": 32245 }, { "epoch": 0.97, "learning_rate": 1.0708955534171616e-08, "loss": 1.1401, "step": 32246 }, { "epoch": 0.97, "learning_rate": 1.0686414582785909e-08, "loss": 1.0541, "step": 32247 }, { "epoch": 0.97, "learning_rate": 1.0663897328466455e-08, "loss": 1.1791, "step": 32248 }, { "epoch": 0.97, "learning_rate": 1.0641403771428082e-08, "loss": 1.0779, "step": 32249 }, { "epoch": 0.97, "learning_rate": 1.061893391188451e-08, "loss": 1.0324, "step": 32250 }, { "epoch": 0.97, "learning_rate": 1.0596487750049734e-08, "loss": 1.0801, "step": 32251 }, { "epoch": 0.97, "learning_rate": 1.0574065286137747e-08, "loss": 1.0723, "step": 32252 }, { "epoch": 0.97, "learning_rate": 1.0551666520361437e-08, "loss": 1.0315, "step": 32253 }, { "epoch": 0.97, "learning_rate": 1.0529291452934244e-08, "loss": 1.1265, "step": 32254 }, { "epoch": 0.97, "learning_rate": 1.0506940084069329e-08, "loss": 0.9989, "step": 32255 }, { "epoch": 0.97, "learning_rate": 1.0484612413979301e-08, "loss": 1.2179, "step": 32256 }, { "epoch": 0.97, "learning_rate": 1.0462308442877045e-08, "loss": 1.0564, "step": 32257 }, { "epoch": 0.97, "learning_rate": 1.0440028170974337e-08, "loss": 1.0771, "step": 32258 }, { "epoch": 0.97, "learning_rate": 1.0417771598483784e-08, "loss": 1.0723, "step": 32259 }, { "epoch": 0.97, "learning_rate": 1.0395538725616605e-08, "loss": 0.9776, "step": 32260 }, { "epoch": 0.97, "learning_rate": 1.0373329552585133e-08, "loss": 1.1885, "step": 32261 }, { "epoch": 0.97, "learning_rate": 1.0351144079600584e-08, "loss": 1.2202, "step": 32262 }, { "epoch": 0.97, "learning_rate": 1.032898230687418e-08, "loss": 1.1183, "step": 32263 }, { "epoch": 0.97, "learning_rate": 1.0306844234616586e-08, "loss": 1.1022, "step": 32264 }, { "epoch": 0.97, "learning_rate": 1.0284729863038745e-08, "loss": 1.0422, "step": 32265 }, { "epoch": 0.97, "learning_rate": 1.0262639192351042e-08, "loss": 1.0303, "step": 32266 }, { "epoch": 0.97, "learning_rate": 1.0240572222764144e-08, "loss": 0.9656, "step": 32267 }, { "epoch": 0.97, "learning_rate": 1.0218528954487883e-08, "loss": 1.1469, "step": 32268 }, { "epoch": 0.97, "learning_rate": 1.019650938773209e-08, "loss": 1.1701, "step": 32269 }, { "epoch": 0.97, "learning_rate": 1.017451352270632e-08, "loss": 1.0115, "step": 32270 }, { "epoch": 0.97, "learning_rate": 1.0152541359620127e-08, "loss": 1.1409, "step": 32271 }, { "epoch": 0.97, "learning_rate": 1.013059289868279e-08, "loss": 1.073, "step": 32272 }, { "epoch": 0.97, "learning_rate": 1.0108668140102752e-08, "loss": 1.1491, "step": 32273 }, { "epoch": 0.97, "learning_rate": 1.008676708408901e-08, "loss": 1.2151, "step": 32274 }, { "epoch": 0.97, "learning_rate": 1.0064889730850014e-08, "loss": 1.0823, "step": 32275 }, { "epoch": 0.97, "learning_rate": 1.0043036080594205e-08, "loss": 1.0081, "step": 32276 }, { "epoch": 0.97, "learning_rate": 1.002120613352947e-08, "loss": 1.0418, "step": 32277 }, { "epoch": 0.97, "learning_rate": 9.999399889863703e-09, "loss": 1.0154, "step": 32278 }, { "epoch": 0.97, "learning_rate": 9.977617349804514e-09, "loss": 1.0721, "step": 32279 }, { "epoch": 0.97, "learning_rate": 9.955858513558959e-09, "loss": 1.0013, "step": 32280 }, { "epoch": 0.97, "learning_rate": 9.934123381334371e-09, "loss": 1.0646, "step": 32281 }, { "epoch": 0.97, "learning_rate": 9.912411953337809e-09, "loss": 1.2466, "step": 32282 }, { "epoch": 0.97, "learning_rate": 9.890724229775773e-09, "loss": 1.0565, "step": 32283 }, { "epoch": 0.97, "learning_rate": 9.869060210854764e-09, "loss": 1.1318, "step": 32284 }, { "epoch": 0.97, "learning_rate": 9.847419896781007e-09, "loss": 1.0599, "step": 32285 }, { "epoch": 0.97, "learning_rate": 9.82580328776045e-09, "loss": 1.1633, "step": 32286 }, { "epoch": 0.97, "learning_rate": 9.804210383999035e-09, "loss": 1.085, "step": 32287 }, { "epoch": 0.97, "learning_rate": 9.782641185702157e-09, "loss": 1.1171, "step": 32288 }, { "epoch": 0.97, "learning_rate": 9.761095693075206e-09, "loss": 1.0875, "step": 32289 }, { "epoch": 0.97, "learning_rate": 9.739573906323296e-09, "loss": 1.0843, "step": 32290 }, { "epoch": 0.97, "learning_rate": 9.718075825651264e-09, "loss": 1.0919, "step": 32291 }, { "epoch": 0.97, "learning_rate": 9.696601451263942e-09, "loss": 1.1373, "step": 32292 }, { "epoch": 0.97, "learning_rate": 9.675150783365339e-09, "loss": 1.1404, "step": 32293 }, { "epoch": 0.97, "learning_rate": 9.653723822160287e-09, "loss": 1.1466, "step": 32294 }, { "epoch": 0.97, "learning_rate": 9.632320567852239e-09, "loss": 1.1821, "step": 32295 }, { "epoch": 0.97, "learning_rate": 9.610941020644915e-09, "loss": 1.0825, "step": 32296 }, { "epoch": 0.97, "learning_rate": 9.589585180742044e-09, "loss": 1.098, "step": 32297 }, { "epoch": 0.97, "learning_rate": 9.568253048347075e-09, "loss": 1.2363, "step": 32298 }, { "epoch": 0.97, "learning_rate": 9.546944623662901e-09, "loss": 1.1172, "step": 32299 }, { "epoch": 0.97, "learning_rate": 9.525659906892138e-09, "loss": 0.9097, "step": 32300 }, { "epoch": 0.97, "learning_rate": 9.504398898237955e-09, "loss": 1.0856, "step": 32301 }, { "epoch": 0.97, "learning_rate": 9.483161597902412e-09, "loss": 1.0341, "step": 32302 }, { "epoch": 0.97, "learning_rate": 9.461948006087296e-09, "loss": 0.9861, "step": 32303 }, { "epoch": 0.97, "learning_rate": 9.44075812299522e-09, "loss": 0.9123, "step": 32304 }, { "epoch": 0.97, "learning_rate": 9.419591948827689e-09, "loss": 1.1392, "step": 32305 }, { "epoch": 0.97, "learning_rate": 9.398449483785932e-09, "loss": 0.9457, "step": 32306 }, { "epoch": 0.97, "learning_rate": 9.377330728071732e-09, "loss": 1.0699, "step": 32307 }, { "epoch": 0.97, "learning_rate": 9.356235681885484e-09, "loss": 1.0717, "step": 32308 }, { "epoch": 0.97, "learning_rate": 9.335164345428415e-09, "loss": 1.1133, "step": 32309 }, { "epoch": 0.97, "learning_rate": 9.3141167189012e-09, "loss": 1.0747, "step": 32310 }, { "epoch": 0.97, "learning_rate": 9.293092802503956e-09, "loss": 1.1505, "step": 32311 }, { "epoch": 0.97, "learning_rate": 9.272092596437077e-09, "loss": 1.0567, "step": 32312 }, { "epoch": 0.97, "learning_rate": 9.251116100900127e-09, "loss": 0.9261, "step": 32313 }, { "epoch": 0.97, "learning_rate": 9.230163316092944e-09, "loss": 1.0665, "step": 32314 }, { "epoch": 0.97, "learning_rate": 9.209234242215093e-09, "loss": 0.9871, "step": 32315 }, { "epoch": 0.97, "learning_rate": 9.18832887946558e-09, "loss": 1.0899, "step": 32316 }, { "epoch": 0.97, "learning_rate": 9.167447228043691e-09, "loss": 1.0623, "step": 32317 }, { "epoch": 0.97, "learning_rate": 9.146589288147877e-09, "loss": 1.0087, "step": 32318 }, { "epoch": 0.97, "learning_rate": 9.125755059977149e-09, "loss": 1.2467, "step": 32319 }, { "epoch": 0.97, "learning_rate": 9.1049445437294e-09, "loss": 1.1689, "step": 32320 }, { "epoch": 0.97, "learning_rate": 9.084157739603083e-09, "loss": 0.9968, "step": 32321 }, { "epoch": 0.97, "learning_rate": 9.06339464779582e-09, "loss": 1.1396, "step": 32322 }, { "epoch": 0.97, "learning_rate": 9.042655268505506e-09, "loss": 1.0665, "step": 32323 }, { "epoch": 0.97, "learning_rate": 9.021939601929209e-09, "loss": 1.2098, "step": 32324 }, { "epoch": 0.97, "learning_rate": 9.001247648264545e-09, "loss": 1.062, "step": 32325 }, { "epoch": 0.97, "learning_rate": 8.9805794077083e-09, "loss": 0.9898, "step": 32326 }, { "epoch": 0.97, "learning_rate": 8.959934880456989e-09, "loss": 1.1451, "step": 32327 }, { "epoch": 0.97, "learning_rate": 8.939314066707672e-09, "loss": 1.0358, "step": 32328 }, { "epoch": 0.97, "learning_rate": 8.918716966656026e-09, "loss": 1.0682, "step": 32329 }, { "epoch": 0.97, "learning_rate": 8.898143580498564e-09, "loss": 1.0883, "step": 32330 }, { "epoch": 0.97, "learning_rate": 8.877593908431237e-09, "loss": 1.0489, "step": 32331 }, { "epoch": 0.97, "learning_rate": 8.857067950649167e-09, "loss": 1.058, "step": 32332 }, { "epoch": 0.97, "learning_rate": 8.836565707348033e-09, "loss": 1.0659, "step": 32333 }, { "epoch": 0.97, "learning_rate": 8.816087178723231e-09, "loss": 1.1172, "step": 32334 }, { "epoch": 0.97, "learning_rate": 8.795632364969331e-09, "loss": 1.0728, "step": 32335 }, { "epoch": 0.97, "learning_rate": 8.775201266281174e-09, "loss": 1.0164, "step": 32336 }, { "epoch": 0.97, "learning_rate": 8.754793882853606e-09, "loss": 1.1564, "step": 32337 }, { "epoch": 0.97, "learning_rate": 8.734410214880363e-09, "loss": 1.0857, "step": 32338 }, { "epoch": 0.97, "learning_rate": 8.714050262555452e-09, "loss": 1.1276, "step": 32339 }, { "epoch": 0.97, "learning_rate": 8.693714026073163e-09, "loss": 1.0186, "step": 32340 }, { "epoch": 0.97, "learning_rate": 8.673401505626956e-09, "loss": 1.0894, "step": 32341 }, { "epoch": 0.97, "learning_rate": 8.653112701410005e-09, "loss": 1.0152, "step": 32342 }, { "epoch": 0.97, "learning_rate": 8.632847613615492e-09, "loss": 1.3068, "step": 32343 }, { "epoch": 0.97, "learning_rate": 8.612606242436317e-09, "loss": 1.0107, "step": 32344 }, { "epoch": 0.97, "learning_rate": 8.592388588065382e-09, "loss": 1.0499, "step": 32345 }, { "epoch": 0.97, "learning_rate": 8.572194650695031e-09, "loss": 1.0676, "step": 32346 }, { "epoch": 0.97, "learning_rate": 8.552024430517613e-09, "loss": 1.0692, "step": 32347 }, { "epoch": 0.97, "learning_rate": 8.531877927724641e-09, "loss": 1.0576, "step": 32348 }, { "epoch": 0.97, "learning_rate": 8.51175514250846e-09, "loss": 1.2061, "step": 32349 }, { "epoch": 0.97, "learning_rate": 8.491656075060584e-09, "loss": 1.062, "step": 32350 }, { "epoch": 0.97, "learning_rate": 8.471580725571971e-09, "loss": 1.1083, "step": 32351 }, { "epoch": 0.97, "learning_rate": 8.451529094233857e-09, "loss": 1.077, "step": 32352 }, { "epoch": 0.97, "learning_rate": 8.431501181237478e-09, "loss": 1.0482, "step": 32353 }, { "epoch": 0.97, "learning_rate": 8.41149698677296e-09, "loss": 1.1935, "step": 32354 }, { "epoch": 0.97, "learning_rate": 8.39151651103126e-09, "loss": 1.1384, "step": 32355 }, { "epoch": 0.97, "learning_rate": 8.37155975420223e-09, "loss": 1.0097, "step": 32356 }, { "epoch": 0.97, "learning_rate": 8.351626716475713e-09, "loss": 1.0839, "step": 32357 }, { "epoch": 0.97, "learning_rate": 8.331717398041839e-09, "loss": 1.0058, "step": 32358 }, { "epoch": 0.97, "learning_rate": 8.311831799090175e-09, "loss": 1.0312, "step": 32359 }, { "epoch": 0.97, "learning_rate": 8.291969919809461e-09, "loss": 0.9178, "step": 32360 }, { "epoch": 0.97, "learning_rate": 8.272131760389545e-09, "loss": 1.1338, "step": 32361 }, { "epoch": 0.97, "learning_rate": 8.25231732101861e-09, "loss": 1.2524, "step": 32362 }, { "epoch": 0.97, "learning_rate": 8.23252660188567e-09, "loss": 1.071, "step": 32363 }, { "epoch": 0.97, "learning_rate": 8.21275960317891e-09, "loss": 1.1588, "step": 32364 }, { "epoch": 0.97, "learning_rate": 8.19301632508679e-09, "loss": 1.1115, "step": 32365 }, { "epoch": 0.98, "learning_rate": 8.173296767796934e-09, "loss": 1.1391, "step": 32366 }, { "epoch": 0.98, "learning_rate": 8.153600931497253e-09, "loss": 1.0914, "step": 32367 }, { "epoch": 0.98, "learning_rate": 8.133928816375091e-09, "loss": 1.1705, "step": 32368 }, { "epoch": 0.98, "learning_rate": 8.114280422617804e-09, "loss": 1.0513, "step": 32369 }, { "epoch": 0.98, "learning_rate": 8.094655750412461e-09, "loss": 1.078, "step": 32370 }, { "epoch": 0.98, "learning_rate": 8.075054799945858e-09, "loss": 1.1055, "step": 32371 }, { "epoch": 0.98, "learning_rate": 8.055477571404514e-09, "loss": 1.114, "step": 32372 }, { "epoch": 0.98, "learning_rate": 8.035924064974943e-09, "loss": 1.0952, "step": 32373 }, { "epoch": 0.98, "learning_rate": 8.01639428084311e-09, "loss": 1.0546, "step": 32374 }, { "epoch": 0.98, "learning_rate": 7.996888219194975e-09, "loss": 1.0975, "step": 32375 }, { "epoch": 0.98, "learning_rate": 7.977405880216505e-09, "loss": 1.104, "step": 32376 }, { "epoch": 0.98, "learning_rate": 7.957947264092825e-09, "loss": 1.0142, "step": 32377 }, { "epoch": 0.98, "learning_rate": 7.938512371009066e-09, "loss": 1.0611, "step": 32378 }, { "epoch": 0.98, "learning_rate": 7.919101201150637e-09, "loss": 1.1364, "step": 32379 }, { "epoch": 0.98, "learning_rate": 7.899713754702388e-09, "loss": 1.1249, "step": 32380 }, { "epoch": 0.98, "learning_rate": 7.880350031848339e-09, "loss": 1.2734, "step": 32381 }, { "epoch": 0.98, "learning_rate": 7.861010032773065e-09, "loss": 0.9941, "step": 32382 }, { "epoch": 0.98, "learning_rate": 7.841693757660861e-09, "loss": 1.0834, "step": 32383 }, { "epoch": 0.98, "learning_rate": 7.822401206695474e-09, "loss": 1.1321, "step": 32384 }, { "epoch": 0.98, "learning_rate": 7.803132380060363e-09, "loss": 1.045, "step": 32385 }, { "epoch": 0.98, "learning_rate": 7.783887277939273e-09, "loss": 1.0479, "step": 32386 }, { "epoch": 0.98, "learning_rate": 7.76466590051539e-09, "loss": 1.1682, "step": 32387 }, { "epoch": 0.98, "learning_rate": 7.745468247971343e-09, "loss": 1.1753, "step": 32388 }, { "epoch": 0.98, "learning_rate": 7.726294320490325e-09, "loss": 1.0698, "step": 32389 }, { "epoch": 0.98, "learning_rate": 7.707144118254684e-09, "loss": 1.1418, "step": 32390 }, { "epoch": 0.98, "learning_rate": 7.6880176414465e-09, "loss": 1.1094, "step": 32391 }, { "epoch": 0.98, "learning_rate": 7.668914890248403e-09, "loss": 1.1028, "step": 32392 }, { "epoch": 0.98, "learning_rate": 7.649835864841637e-09, "loss": 1.0488, "step": 32393 }, { "epoch": 0.98, "learning_rate": 7.630780565408002e-09, "loss": 1.0711, "step": 32394 }, { "epoch": 0.98, "learning_rate": 7.61174899212902e-09, "loss": 1.0685, "step": 32395 }, { "epoch": 0.98, "learning_rate": 7.592741145185933e-09, "loss": 1.1194, "step": 32396 }, { "epoch": 0.98, "learning_rate": 7.573757024759709e-09, "loss": 1.0906, "step": 32397 }, { "epoch": 0.98, "learning_rate": 7.554796631030481e-09, "loss": 1.0951, "step": 32398 }, { "epoch": 0.98, "learning_rate": 7.535859964179493e-09, "loss": 1.1421, "step": 32399 }, { "epoch": 0.98, "learning_rate": 7.5169470243866e-09, "loss": 1.1073, "step": 32400 }, { "epoch": 0.98, "learning_rate": 7.498057811831937e-09, "loss": 1.0613, "step": 32401 }, { "epoch": 0.98, "learning_rate": 7.479192326695638e-09, "loss": 1.0477, "step": 32402 }, { "epoch": 0.98, "learning_rate": 7.46035056915645e-09, "loss": 1.1135, "step": 32403 }, { "epoch": 0.98, "learning_rate": 7.44153253939478e-09, "loss": 1.1343, "step": 32404 }, { "epoch": 0.98, "learning_rate": 7.422738237588822e-09, "loss": 1.2129, "step": 32405 }, { "epoch": 0.98, "learning_rate": 7.403967663918432e-09, "loss": 1.1201, "step": 32406 }, { "epoch": 0.98, "learning_rate": 7.385220818561245e-09, "loss": 1.0242, "step": 32407 }, { "epoch": 0.98, "learning_rate": 7.3664977016965626e-09, "loss": 1.0931, "step": 32408 }, { "epoch": 0.98, "learning_rate": 7.347798313502297e-09, "loss": 1.1352, "step": 32409 }, { "epoch": 0.98, "learning_rate": 7.32912265415664e-09, "loss": 1.1661, "step": 32410 }, { "epoch": 0.98, "learning_rate": 7.310470723836949e-09, "loss": 1.0197, "step": 32411 }, { "epoch": 0.98, "learning_rate": 7.291842522721415e-09, "loss": 1.079, "step": 32412 }, { "epoch": 0.98, "learning_rate": 7.273238050986564e-09, "loss": 1.1975, "step": 32413 }, { "epoch": 0.98, "learning_rate": 7.254657308810309e-09, "loss": 1.1544, "step": 32414 }, { "epoch": 0.98, "learning_rate": 7.236100296368898e-09, "loss": 1.0768, "step": 32415 }, { "epoch": 0.98, "learning_rate": 7.2175670138394106e-09, "loss": 1.1495, "step": 32416 }, { "epoch": 0.98, "learning_rate": 7.199057461398095e-09, "loss": 1.124, "step": 32417 }, { "epoch": 0.98, "learning_rate": 7.180571639221201e-09, "loss": 1.0035, "step": 32418 }, { "epoch": 0.98, "learning_rate": 7.162109547484697e-09, "loss": 1.0455, "step": 32419 }, { "epoch": 0.98, "learning_rate": 7.143671186364276e-09, "loss": 1.0928, "step": 32420 }, { "epoch": 0.98, "learning_rate": 7.125256556035354e-09, "loss": 1.1298, "step": 32421 }, { "epoch": 0.98, "learning_rate": 7.106865656673623e-09, "loss": 1.1865, "step": 32422 }, { "epoch": 0.98, "learning_rate": 7.088498488453943e-09, "loss": 1.1432, "step": 32423 }, { "epoch": 0.98, "learning_rate": 7.070155051550898e-09, "loss": 1.0673, "step": 32424 }, { "epoch": 0.98, "learning_rate": 7.051835346139346e-09, "loss": 1.1373, "step": 32425 }, { "epoch": 0.98, "learning_rate": 7.033539372393872e-09, "loss": 1.0493, "step": 32426 }, { "epoch": 0.98, "learning_rate": 7.015267130488223e-09, "loss": 1.0778, "step": 32427 }, { "epoch": 0.98, "learning_rate": 6.997018620596985e-09, "loss": 1.1292, "step": 32428 }, { "epoch": 0.98, "learning_rate": 6.978793842893072e-09, "loss": 1.1078, "step": 32429 }, { "epoch": 0.98, "learning_rate": 6.960592797550514e-09, "loss": 1.1899, "step": 32430 }, { "epoch": 0.98, "learning_rate": 6.942415484742226e-09, "loss": 1.04, "step": 32431 }, { "epoch": 0.98, "learning_rate": 6.924261904641682e-09, "loss": 1.0472, "step": 32432 }, { "epoch": 0.98, "learning_rate": 6.906132057421522e-09, "loss": 1.1293, "step": 32433 }, { "epoch": 0.98, "learning_rate": 6.8880259432541066e-09, "loss": 0.9515, "step": 32434 }, { "epoch": 0.98, "learning_rate": 6.869943562311798e-09, "loss": 1.0689, "step": 32435 }, { "epoch": 0.98, "learning_rate": 6.851884914767237e-09, "loss": 1.2748, "step": 32436 }, { "epoch": 0.98, "learning_rate": 6.833850000791675e-09, "loss": 1.1932, "step": 32437 }, { "epoch": 0.98, "learning_rate": 6.815838820557474e-09, "loss": 1.0554, "step": 32438 }, { "epoch": 0.98, "learning_rate": 6.797851374235331e-09, "loss": 1.0097, "step": 32439 }, { "epoch": 0.98, "learning_rate": 6.779887661997054e-09, "loss": 1.1466, "step": 32440 }, { "epoch": 0.98, "learning_rate": 6.761947684013614e-09, "loss": 1.1191, "step": 32441 }, { "epoch": 0.98, "learning_rate": 6.744031440455434e-09, "loss": 1.1445, "step": 32442 }, { "epoch": 0.98, "learning_rate": 6.726138931493209e-09, "loss": 1.2711, "step": 32443 }, { "epoch": 0.98, "learning_rate": 6.708270157297636e-09, "loss": 1.0488, "step": 32444 }, { "epoch": 0.98, "learning_rate": 6.690425118038302e-09, "loss": 1.0294, "step": 32445 }, { "epoch": 0.98, "learning_rate": 6.672603813885348e-09, "loss": 1.0305, "step": 32446 }, { "epoch": 0.98, "learning_rate": 6.6548062450083605e-09, "loss": 1.0813, "step": 32447 }, { "epoch": 0.98, "learning_rate": 6.637032411576927e-09, "loss": 1.0101, "step": 32448 }, { "epoch": 0.98, "learning_rate": 6.619282313760078e-09, "loss": 0.9954, "step": 32449 }, { "epoch": 0.98, "learning_rate": 6.601555951726568e-09, "loss": 1.1716, "step": 32450 }, { "epoch": 0.98, "learning_rate": 6.583853325645706e-09, "loss": 1.1389, "step": 32451 }, { "epoch": 0.98, "learning_rate": 6.566174435685413e-09, "loss": 1.018, "step": 32452 }, { "epoch": 0.98, "learning_rate": 6.548519282014443e-09, "loss": 1.0961, "step": 32453 }, { "epoch": 0.98, "learning_rate": 6.530887864800717e-09, "loss": 1.0795, "step": 32454 }, { "epoch": 0.98, "learning_rate": 6.513280184211878e-09, "loss": 1.03, "step": 32455 }, { "epoch": 0.98, "learning_rate": 6.495696240415572e-09, "loss": 1.1017, "step": 32456 }, { "epoch": 0.98, "learning_rate": 6.4781360335797184e-09, "loss": 1.0852, "step": 32457 }, { "epoch": 0.98, "learning_rate": 6.460599563870851e-09, "loss": 1.1778, "step": 32458 }, { "epoch": 0.98, "learning_rate": 6.443086831456058e-09, "loss": 1.0931, "step": 32459 }, { "epoch": 0.98, "learning_rate": 6.425597836502428e-09, "loss": 1.098, "step": 32460 }, { "epoch": 0.98, "learning_rate": 6.408132579175941e-09, "loss": 1.113, "step": 32461 }, { "epoch": 0.98, "learning_rate": 6.390691059643128e-09, "loss": 1.029, "step": 32462 }, { "epoch": 0.98, "learning_rate": 6.373273278069969e-09, "loss": 1.084, "step": 32463 }, { "epoch": 0.98, "learning_rate": 6.355879234622164e-09, "loss": 1.0249, "step": 32464 }, { "epoch": 0.98, "learning_rate": 6.3385089294656925e-09, "loss": 1.1052, "step": 32465 }, { "epoch": 0.98, "learning_rate": 6.321162362765421e-09, "loss": 0.9319, "step": 32466 }, { "epoch": 0.98, "learning_rate": 6.303839534686773e-09, "loss": 1.1909, "step": 32467 }, { "epoch": 0.98, "learning_rate": 6.2865404453946176e-09, "loss": 1.2425, "step": 32468 }, { "epoch": 0.98, "learning_rate": 6.269265095053267e-09, "loss": 1.022, "step": 32469 }, { "epoch": 0.98, "learning_rate": 6.252013483827868e-09, "loss": 1.1049, "step": 32470 }, { "epoch": 0.98, "learning_rate": 6.234785611882177e-09, "loss": 1.0953, "step": 32471 }, { "epoch": 0.98, "learning_rate": 6.217581479379953e-09, "loss": 1.0559, "step": 32472 }, { "epoch": 0.98, "learning_rate": 6.200401086485786e-09, "loss": 0.9772, "step": 32473 }, { "epoch": 0.98, "learning_rate": 6.183244433362323e-09, "loss": 1.1921, "step": 32474 }, { "epoch": 0.98, "learning_rate": 6.166111520173601e-09, "loss": 1.0353, "step": 32475 }, { "epoch": 0.98, "learning_rate": 6.149002347082544e-09, "loss": 1.0784, "step": 32476 }, { "epoch": 0.98, "learning_rate": 6.131916914251524e-09, "loss": 1.0784, "step": 32477 }, { "epoch": 0.98, "learning_rate": 6.1148552218437404e-09, "loss": 1.0605, "step": 32478 }, { "epoch": 0.98, "learning_rate": 6.097817270021567e-09, "loss": 1.0583, "step": 32479 }, { "epoch": 0.98, "learning_rate": 6.080803058947093e-09, "loss": 1.0915, "step": 32480 }, { "epoch": 0.98, "learning_rate": 6.063812588781859e-09, "loss": 1.0917, "step": 32481 }, { "epoch": 0.98, "learning_rate": 6.04684585968851e-09, "loss": 1.0431, "step": 32482 }, { "epoch": 0.98, "learning_rate": 6.029902871827753e-09, "loss": 1.0805, "step": 32483 }, { "epoch": 0.98, "learning_rate": 6.012983625361124e-09, "loss": 1.0807, "step": 32484 }, { "epoch": 0.98, "learning_rate": 5.996088120449884e-09, "loss": 1.103, "step": 32485 }, { "epoch": 0.98, "learning_rate": 5.979216357254736e-09, "loss": 1.0273, "step": 32486 }, { "epoch": 0.98, "learning_rate": 5.962368335936386e-09, "loss": 1.0938, "step": 32487 }, { "epoch": 0.98, "learning_rate": 5.945544056654984e-09, "loss": 1.0557, "step": 32488 }, { "epoch": 0.98, "learning_rate": 5.928743519570957e-09, "loss": 1.0009, "step": 32489 }, { "epoch": 0.98, "learning_rate": 5.911966724843899e-09, "loss": 1.0597, "step": 32490 }, { "epoch": 0.98, "learning_rate": 5.895213672633682e-09, "loss": 1.0495, "step": 32491 }, { "epoch": 0.98, "learning_rate": 5.878484363100179e-09, "loss": 1.213, "step": 32492 }, { "epoch": 0.98, "learning_rate": 5.861778796402151e-09, "loss": 1.2117, "step": 32493 }, { "epoch": 0.98, "learning_rate": 5.845096972698638e-09, "loss": 1.1191, "step": 32494 }, { "epoch": 0.98, "learning_rate": 5.82843889214868e-09, "loss": 1.2012, "step": 32495 }, { "epoch": 0.98, "learning_rate": 5.811804554910483e-09, "loss": 1.0813, "step": 32496 }, { "epoch": 0.98, "learning_rate": 5.795193961143086e-09, "loss": 1.0425, "step": 32497 }, { "epoch": 0.98, "learning_rate": 5.778607111003864e-09, "loss": 1.0366, "step": 32498 }, { "epoch": 0.98, "learning_rate": 5.762044004651302e-09, "loss": 1.1232, "step": 32499 }, { "epoch": 0.98, "learning_rate": 5.745504642242494e-09, "loss": 1.1447, "step": 32500 }, { "epoch": 0.98, "learning_rate": 5.728989023935649e-09, "loss": 1.1318, "step": 32501 }, { "epoch": 0.98, "learning_rate": 5.712497149887308e-09, "loss": 1.0199, "step": 32502 }, { "epoch": 0.98, "learning_rate": 5.696029020254567e-09, "loss": 1.1353, "step": 32503 }, { "epoch": 0.98, "learning_rate": 5.6795846351945235e-09, "loss": 1.0341, "step": 32504 }, { "epoch": 0.98, "learning_rate": 5.663163994863441e-09, "loss": 1.155, "step": 32505 }, { "epoch": 0.98, "learning_rate": 5.64676709941786e-09, "loss": 1.0893, "step": 32506 }, { "epoch": 0.98, "learning_rate": 5.630393949013491e-09, "loss": 1.0992, "step": 32507 }, { "epoch": 0.98, "learning_rate": 5.614044543806596e-09, "loss": 1.1069, "step": 32508 }, { "epoch": 0.98, "learning_rate": 5.597718883952607e-09, "loss": 1.0738, "step": 32509 }, { "epoch": 0.98, "learning_rate": 5.581416969606957e-09, "loss": 1.1644, "step": 32510 }, { "epoch": 0.98, "learning_rate": 5.565138800925074e-09, "loss": 1.0945, "step": 32511 }, { "epoch": 0.98, "learning_rate": 5.548884378061559e-09, "loss": 1.0604, "step": 32512 }, { "epoch": 0.98, "learning_rate": 5.532653701171286e-09, "loss": 1.2464, "step": 32513 }, { "epoch": 0.98, "learning_rate": 5.5164467704088566e-09, "loss": 1.093, "step": 32514 }, { "epoch": 0.98, "learning_rate": 5.500263585928311e-09, "loss": 1.0667, "step": 32515 }, { "epoch": 0.98, "learning_rate": 5.484104147883973e-09, "loss": 1.1332, "step": 32516 }, { "epoch": 0.98, "learning_rate": 5.467968456429607e-09, "loss": 1.0869, "step": 32517 }, { "epoch": 0.98, "learning_rate": 5.4518565117187e-09, "loss": 1.1408, "step": 32518 }, { "epoch": 0.98, "learning_rate": 5.4357683139047436e-09, "loss": 1.0555, "step": 32519 }, { "epoch": 0.98, "learning_rate": 5.419703863140669e-09, "loss": 1.0792, "step": 32520 }, { "epoch": 0.98, "learning_rate": 5.403663159579686e-09, "loss": 1.1612, "step": 32521 }, { "epoch": 0.98, "learning_rate": 5.3876462033744524e-09, "loss": 0.9602, "step": 32522 }, { "epoch": 0.98, "learning_rate": 5.371652994677345e-09, "loss": 1.1098, "step": 32523 }, { "epoch": 0.98, "learning_rate": 5.355683533640743e-09, "loss": 1.1166, "step": 32524 }, { "epoch": 0.98, "learning_rate": 5.339737820416469e-09, "loss": 1.0582, "step": 32525 }, { "epoch": 0.98, "learning_rate": 5.323815855156622e-09, "loss": 0.9882, "step": 32526 }, { "epoch": 0.98, "learning_rate": 5.307917638012195e-09, "loss": 1.0654, "step": 32527 }, { "epoch": 0.98, "learning_rate": 5.292043169135286e-09, "loss": 1.028, "step": 32528 }, { "epoch": 0.98, "learning_rate": 5.276192448676331e-09, "loss": 1.0421, "step": 32529 }, { "epoch": 0.98, "learning_rate": 5.2603654767866e-09, "loss": 1.0629, "step": 32530 }, { "epoch": 0.98, "learning_rate": 5.244562253616803e-09, "loss": 1.0819, "step": 32531 }, { "epoch": 0.98, "learning_rate": 5.2287827793170985e-09, "loss": 1.0402, "step": 32532 }, { "epoch": 0.98, "learning_rate": 5.213027054037922e-09, "loss": 1.0789, "step": 32533 }, { "epoch": 0.98, "learning_rate": 5.1972950779294315e-09, "loss": 1.1253, "step": 32534 }, { "epoch": 0.98, "learning_rate": 5.181586851140952e-09, "loss": 1.053, "step": 32535 }, { "epoch": 0.98, "learning_rate": 5.1659023738220845e-09, "loss": 1.0714, "step": 32536 }, { "epoch": 0.98, "learning_rate": 5.150241646122434e-09, "loss": 1.2047, "step": 32537 }, { "epoch": 0.98, "learning_rate": 5.134604668191046e-09, "loss": 0.9828, "step": 32538 }, { "epoch": 0.98, "learning_rate": 5.118991440176413e-09, "loss": 1.0327, "step": 32539 }, { "epoch": 0.98, "learning_rate": 5.103401962227583e-09, "loss": 0.976, "step": 32540 }, { "epoch": 0.98, "learning_rate": 5.087836234492494e-09, "loss": 1.0768, "step": 32541 }, { "epoch": 0.98, "learning_rate": 5.072294257119914e-09, "loss": 0.9483, "step": 32542 }, { "epoch": 0.98, "learning_rate": 5.056776030257227e-09, "loss": 1.1124, "step": 32543 }, { "epoch": 0.98, "learning_rate": 5.041281554052646e-09, "loss": 1.0861, "step": 32544 }, { "epoch": 0.98, "learning_rate": 5.0258108286535545e-09, "loss": 1.0483, "step": 32545 }, { "epoch": 0.98, "learning_rate": 5.010363854206779e-09, "loss": 1.0048, "step": 32546 }, { "epoch": 0.98, "learning_rate": 4.994940630859979e-09, "loss": 1.0233, "step": 32547 }, { "epoch": 0.98, "learning_rate": 4.9795411587597045e-09, "loss": 1.0973, "step": 32548 }, { "epoch": 0.98, "learning_rate": 4.964165438052504e-09, "loss": 1.0595, "step": 32549 }, { "epoch": 0.98, "learning_rate": 4.94881346888465e-09, "loss": 1.1553, "step": 32550 }, { "epoch": 0.98, "learning_rate": 4.933485251402692e-09, "loss": 1.1311, "step": 32551 }, { "epoch": 0.98, "learning_rate": 4.918180785752069e-09, "loss": 1.0249, "step": 32552 }, { "epoch": 0.98, "learning_rate": 4.902900072078775e-09, "loss": 1.1226, "step": 32553 }, { "epoch": 0.98, "learning_rate": 4.887643110528251e-09, "loss": 1.1137, "step": 32554 }, { "epoch": 0.98, "learning_rate": 4.872409901245379e-09, "loss": 1.1719, "step": 32555 }, { "epoch": 0.98, "learning_rate": 4.857200444375876e-09, "loss": 1.1305, "step": 32556 }, { "epoch": 0.98, "learning_rate": 4.842014740063794e-09, "loss": 1.033, "step": 32557 }, { "epoch": 0.98, "learning_rate": 4.826852788454295e-09, "loss": 1.0668, "step": 32558 }, { "epoch": 0.98, "learning_rate": 4.81171458969143e-09, "loss": 1.1264, "step": 32559 }, { "epoch": 0.98, "learning_rate": 4.7966001439189724e-09, "loss": 1.0706, "step": 32560 }, { "epoch": 0.98, "learning_rate": 4.78150945128153e-09, "loss": 1.1646, "step": 32561 }, { "epoch": 0.98, "learning_rate": 4.76644251192232e-09, "loss": 1.1857, "step": 32562 }, { "epoch": 0.98, "learning_rate": 4.751399325984563e-09, "loss": 0.9002, "step": 32563 }, { "epoch": 0.98, "learning_rate": 4.736379893612031e-09, "loss": 1.0148, "step": 32564 }, { "epoch": 0.98, "learning_rate": 4.721384214947388e-09, "loss": 1.0192, "step": 32565 }, { "epoch": 0.98, "learning_rate": 4.7064122901332995e-09, "loss": 1.0419, "step": 32566 }, { "epoch": 0.98, "learning_rate": 4.691464119312428e-09, "loss": 1.0366, "step": 32567 }, { "epoch": 0.98, "learning_rate": 4.676539702626881e-09, "loss": 1.0931, "step": 32568 }, { "epoch": 0.98, "learning_rate": 4.661639040219046e-09, "loss": 1.139, "step": 32569 }, { "epoch": 0.98, "learning_rate": 4.646762132230753e-09, "loss": 1.0704, "step": 32570 }, { "epoch": 0.98, "learning_rate": 4.631908978803279e-09, "loss": 1.0095, "step": 32571 }, { "epoch": 0.98, "learning_rate": 4.617079580078176e-09, "loss": 1.0514, "step": 32572 }, { "epoch": 0.98, "learning_rate": 4.602273936196721e-09, "loss": 1.1299, "step": 32573 }, { "epoch": 0.98, "learning_rate": 4.5874920472996355e-09, "loss": 1.1273, "step": 32574 }, { "epoch": 0.98, "learning_rate": 4.572733913528193e-09, "loss": 1.0112, "step": 32575 }, { "epoch": 0.98, "learning_rate": 4.557999535022284e-09, "loss": 1.0216, "step": 32576 }, { "epoch": 0.98, "learning_rate": 4.543288911922072e-09, "loss": 1.0455, "step": 32577 }, { "epoch": 0.98, "learning_rate": 4.52860204436828e-09, "loss": 1.1057, "step": 32578 }, { "epoch": 0.98, "learning_rate": 4.513938932500239e-09, "loss": 0.9619, "step": 32579 }, { "epoch": 0.98, "learning_rate": 4.499299576457561e-09, "loss": 1.0167, "step": 32580 }, { "epoch": 0.98, "learning_rate": 4.4846839763798554e-09, "loss": 1.1088, "step": 32581 }, { "epoch": 0.98, "learning_rate": 4.470092132405901e-09, "loss": 1.1568, "step": 32582 }, { "epoch": 0.98, "learning_rate": 4.455524044674753e-09, "loss": 1.1051, "step": 32583 }, { "epoch": 0.98, "learning_rate": 4.440979713325189e-09, "loss": 1.0437, "step": 32584 }, { "epoch": 0.98, "learning_rate": 4.426459138495709e-09, "loss": 1.1271, "step": 32585 }, { "epoch": 0.98, "learning_rate": 4.411962320324259e-09, "loss": 1.0916, "step": 32586 }, { "epoch": 0.98, "learning_rate": 4.397489258949061e-09, "loss": 0.9971, "step": 32587 }, { "epoch": 0.98, "learning_rate": 4.383039954507784e-09, "loss": 1.0444, "step": 32588 }, { "epoch": 0.98, "learning_rate": 4.368614407138094e-09, "loss": 1.0005, "step": 32589 }, { "epoch": 0.98, "learning_rate": 4.354212616977382e-09, "loss": 1.1541, "step": 32590 }, { "epoch": 0.98, "learning_rate": 4.339834584162484e-09, "loss": 1.0985, "step": 32591 }, { "epoch": 0.98, "learning_rate": 4.3254803088305095e-09, "loss": 1.0259, "step": 32592 }, { "epoch": 0.98, "learning_rate": 4.311149791118019e-09, "loss": 1.126, "step": 32593 }, { "epoch": 0.98, "learning_rate": 4.296843031161291e-09, "loss": 1.0098, "step": 32594 }, { "epoch": 0.98, "learning_rate": 4.2825600290966055e-09, "loss": 1.1636, "step": 32595 }, { "epoch": 0.98, "learning_rate": 4.268300785060242e-09, "loss": 1.1236, "step": 32596 }, { "epoch": 0.98, "learning_rate": 4.254065299187371e-09, "loss": 1.0424, "step": 32597 }, { "epoch": 0.98, "learning_rate": 4.239853571613994e-09, "loss": 1.0413, "step": 32598 }, { "epoch": 0.98, "learning_rate": 4.225665602475004e-09, "loss": 1.0682, "step": 32599 }, { "epoch": 0.98, "learning_rate": 4.211501391905848e-09, "loss": 1.1567, "step": 32600 }, { "epoch": 0.98, "learning_rate": 4.1973609400411395e-09, "loss": 1.068, "step": 32601 }, { "epoch": 0.98, "learning_rate": 4.1832442470154945e-09, "loss": 1.1434, "step": 32602 }, { "epoch": 0.98, "learning_rate": 4.169151312963526e-09, "loss": 1.1478, "step": 32603 }, { "epoch": 0.98, "learning_rate": 4.155082138019018e-09, "loss": 1.0905, "step": 32604 }, { "epoch": 0.98, "learning_rate": 4.141036722316027e-09, "loss": 1.0401, "step": 32605 }, { "epoch": 0.98, "learning_rate": 4.127015065988338e-09, "loss": 1.1451, "step": 32606 }, { "epoch": 0.98, "learning_rate": 4.113017169169453e-09, "loss": 1.0205, "step": 32607 }, { "epoch": 0.98, "learning_rate": 4.0990430319928774e-09, "loss": 1.0353, "step": 32608 }, { "epoch": 0.98, "learning_rate": 4.085092654591005e-09, "loss": 1.0972, "step": 32609 }, { "epoch": 0.98, "learning_rate": 4.071166037097063e-09, "loss": 1.1974, "step": 32610 }, { "epoch": 0.98, "learning_rate": 4.057263179643445e-09, "loss": 1.0593, "step": 32611 }, { "epoch": 0.98, "learning_rate": 4.043384082362545e-09, "loss": 1.1821, "step": 32612 }, { "epoch": 0.98, "learning_rate": 4.029528745386757e-09, "loss": 1.297, "step": 32613 }, { "epoch": 0.98, "learning_rate": 4.015697168847643e-09, "loss": 1.0175, "step": 32614 }, { "epoch": 0.98, "learning_rate": 4.001889352877042e-09, "loss": 0.9843, "step": 32615 }, { "epoch": 0.98, "learning_rate": 3.988105297606515e-09, "loss": 1.1321, "step": 32616 }, { "epoch": 0.98, "learning_rate": 3.97434500316679e-09, "loss": 1.0825, "step": 32617 }, { "epoch": 0.98, "learning_rate": 3.9606084696894305e-09, "loss": 1.0781, "step": 32618 }, { "epoch": 0.98, "learning_rate": 3.946895697304609e-09, "loss": 1.0476, "step": 32619 }, { "epoch": 0.98, "learning_rate": 3.933206686143332e-09, "loss": 1.0308, "step": 32620 }, { "epoch": 0.98, "learning_rate": 3.91954143633605e-09, "loss": 1.0921, "step": 32621 }, { "epoch": 0.98, "learning_rate": 3.905899948012382e-09, "loss": 1.0678, "step": 32622 }, { "epoch": 0.98, "learning_rate": 3.8922822213022235e-09, "loss": 1.1912, "step": 32623 }, { "epoch": 0.98, "learning_rate": 3.8786882563354725e-09, "loss": 1.1833, "step": 32624 }, { "epoch": 0.98, "learning_rate": 3.8651180532414675e-09, "loss": 1.303, "step": 32625 }, { "epoch": 0.98, "learning_rate": 3.851571612149551e-09, "loss": 1.061, "step": 32626 }, { "epoch": 0.98, "learning_rate": 3.838048933188232e-09, "loss": 1.0184, "step": 32627 }, { "epoch": 0.98, "learning_rate": 3.824550016486572e-09, "loss": 1.0865, "step": 32628 }, { "epoch": 0.98, "learning_rate": 3.811074862173081e-09, "loss": 1.1362, "step": 32629 }, { "epoch": 0.98, "learning_rate": 3.797623470375711e-09, "loss": 1.1071, "step": 32630 }, { "epoch": 0.98, "learning_rate": 3.784195841222971e-09, "loss": 1.1478, "step": 32631 }, { "epoch": 0.98, "learning_rate": 3.770791974842536e-09, "loss": 1.0986, "step": 32632 }, { "epoch": 0.98, "learning_rate": 3.757411871361804e-09, "loss": 1.0543, "step": 32633 }, { "epoch": 0.98, "learning_rate": 3.744055530908175e-09, "loss": 1.0584, "step": 32634 }, { "epoch": 0.98, "learning_rate": 3.730722953609045e-09, "loss": 1.1419, "step": 32635 }, { "epoch": 0.98, "learning_rate": 3.717414139591258e-09, "loss": 1.1889, "step": 32636 }, { "epoch": 0.98, "learning_rate": 3.704129088981101e-09, "loss": 0.972, "step": 32637 }, { "epoch": 0.98, "learning_rate": 3.6908678019056953e-09, "loss": 1.065, "step": 32638 }, { "epoch": 0.98, "learning_rate": 3.6776302784907737e-09, "loss": 1.0607, "step": 32639 }, { "epoch": 0.98, "learning_rate": 3.664416518862901e-09, "loss": 1.108, "step": 32640 }, { "epoch": 0.98, "learning_rate": 3.6512265231472554e-09, "loss": 1.0568, "step": 32641 }, { "epoch": 0.98, "learning_rate": 3.6380602914695695e-09, "loss": 1.1011, "step": 32642 }, { "epoch": 0.98, "learning_rate": 3.6249178239552987e-09, "loss": 1.1254, "step": 32643 }, { "epoch": 0.98, "learning_rate": 3.6117991207296197e-09, "loss": 1.0485, "step": 32644 }, { "epoch": 0.98, "learning_rate": 3.5987041819171565e-09, "loss": 1.1829, "step": 32645 }, { "epoch": 0.98, "learning_rate": 3.585633007642808e-09, "loss": 1.1196, "step": 32646 }, { "epoch": 0.98, "learning_rate": 3.57258559803092e-09, "loss": 1.1739, "step": 32647 }, { "epoch": 0.98, "learning_rate": 3.5595619532058368e-09, "loss": 1.1769, "step": 32648 }, { "epoch": 0.98, "learning_rate": 3.546562073291071e-09, "loss": 0.9977, "step": 32649 }, { "epoch": 0.98, "learning_rate": 3.5335859584109676e-09, "loss": 1.0135, "step": 32650 }, { "epoch": 0.98, "learning_rate": 3.5206336086887614e-09, "loss": 1.0948, "step": 32651 }, { "epoch": 0.98, "learning_rate": 3.5077050242476872e-09, "loss": 1.1271, "step": 32652 }, { "epoch": 0.98, "learning_rate": 3.49480020521098e-09, "loss": 1.0814, "step": 32653 }, { "epoch": 0.98, "learning_rate": 3.4819191517013182e-09, "loss": 1.1174, "step": 32654 }, { "epoch": 0.98, "learning_rate": 3.4690618638416605e-09, "loss": 1.1843, "step": 32655 }, { "epoch": 0.98, "learning_rate": 3.4562283417538535e-09, "loss": 1.0983, "step": 32656 }, { "epoch": 0.98, "learning_rate": 3.443418585560576e-09, "loss": 0.9296, "step": 32657 }, { "epoch": 0.98, "learning_rate": 3.4306325953833985e-09, "loss": 1.0596, "step": 32658 }, { "epoch": 0.98, "learning_rate": 3.417870371344445e-09, "loss": 1.0571, "step": 32659 }, { "epoch": 0.98, "learning_rate": 3.4051319135647297e-09, "loss": 1.1896, "step": 32660 }, { "epoch": 0.98, "learning_rate": 3.3924172221658225e-09, "loss": 1.1899, "step": 32661 }, { "epoch": 0.98, "learning_rate": 3.3797262972687372e-09, "loss": 1.1158, "step": 32662 }, { "epoch": 0.98, "learning_rate": 3.367059138994211e-09, "loss": 1.09, "step": 32663 }, { "epoch": 0.98, "learning_rate": 3.35441574746298e-09, "loss": 1.2325, "step": 32664 }, { "epoch": 0.98, "learning_rate": 3.3417961227952268e-09, "loss": 1.0806, "step": 32665 }, { "epoch": 0.98, "learning_rate": 3.329200265111132e-09, "loss": 0.9831, "step": 32666 }, { "epoch": 0.98, "learning_rate": 3.3166281745306004e-09, "loss": 1.1553, "step": 32667 }, { "epoch": 0.98, "learning_rate": 3.3040798511732585e-09, "loss": 1.1967, "step": 32668 }, { "epoch": 0.98, "learning_rate": 3.2915552951587326e-09, "loss": 1.09, "step": 32669 }, { "epoch": 0.98, "learning_rate": 3.2790545066060943e-09, "loss": 1.0671, "step": 32670 }, { "epoch": 0.98, "learning_rate": 3.2665774856344144e-09, "loss": 1.0367, "step": 32671 }, { "epoch": 0.98, "learning_rate": 3.2541242323624878e-09, "loss": 1.054, "step": 32672 }, { "epoch": 0.98, "learning_rate": 3.24169474690883e-09, "loss": 1.1054, "step": 32673 }, { "epoch": 0.98, "learning_rate": 3.22928902939168e-09, "loss": 1.0978, "step": 32674 }, { "epoch": 0.98, "learning_rate": 3.216907079929277e-09, "loss": 1.0309, "step": 32675 }, { "epoch": 0.98, "learning_rate": 3.2045488986393037e-09, "loss": 1.0515, "step": 32676 }, { "epoch": 0.98, "learning_rate": 3.1922144856397217e-09, "loss": 1.1605, "step": 32677 }, { "epoch": 0.98, "learning_rate": 3.1799038410473826e-09, "loss": 1.1091, "step": 32678 }, { "epoch": 0.98, "learning_rate": 3.167616964980247e-09, "loss": 1.2257, "step": 32679 }, { "epoch": 0.98, "learning_rate": 3.155353857554888e-09, "loss": 1.0551, "step": 32680 }, { "epoch": 0.98, "learning_rate": 3.14311451888788e-09, "loss": 1.0538, "step": 32681 }, { "epoch": 0.98, "learning_rate": 3.1308989490957953e-09, "loss": 1.0955, "step": 32682 }, { "epoch": 0.98, "learning_rate": 3.118707148295208e-09, "loss": 1.1013, "step": 32683 }, { "epoch": 0.98, "learning_rate": 3.1065391166018586e-09, "loss": 1.0082, "step": 32684 }, { "epoch": 0.98, "learning_rate": 3.094394854131766e-09, "loss": 1.0777, "step": 32685 }, { "epoch": 0.98, "learning_rate": 3.0822743610003926e-09, "loss": 1.0446, "step": 32686 }, { "epoch": 0.98, "learning_rate": 3.0701776373234794e-09, "loss": 1.1489, "step": 32687 }, { "epoch": 0.98, "learning_rate": 3.058104683215657e-09, "loss": 1.0818, "step": 32688 }, { "epoch": 0.98, "learning_rate": 3.046055498792111e-09, "loss": 1.1526, "step": 32689 }, { "epoch": 0.98, "learning_rate": 3.0340300841677496e-09, "loss": 1.027, "step": 32690 }, { "epoch": 0.98, "learning_rate": 3.022028439456648e-09, "loss": 1.0894, "step": 32691 }, { "epoch": 0.98, "learning_rate": 3.0100505647734368e-09, "loss": 1.1348, "step": 32692 }, { "epoch": 0.98, "learning_rate": 2.9980964602316364e-09, "loss": 1.2909, "step": 32693 }, { "epoch": 0.98, "learning_rate": 2.9861661259456e-09, "loss": 1.0248, "step": 32694 }, { "epoch": 0.98, "learning_rate": 2.9742595620285696e-09, "loss": 1.1171, "step": 32695 }, { "epoch": 0.98, "learning_rate": 2.9623767685940665e-09, "loss": 1.1752, "step": 32696 }, { "epoch": 0.98, "learning_rate": 2.950517745755055e-09, "loss": 1.1448, "step": 32697 }, { "epoch": 0.99, "learning_rate": 2.9386824936245005e-09, "loss": 1.0889, "step": 32698 }, { "epoch": 0.99, "learning_rate": 2.926871012315091e-09, "loss": 1.0824, "step": 32699 }, { "epoch": 0.99, "learning_rate": 2.9150833019392365e-09, "loss": 1.1677, "step": 32700 }, { "epoch": 0.99, "learning_rate": 2.9033193626090694e-09, "loss": 1.0873, "step": 32701 }, { "epoch": 0.99, "learning_rate": 2.891579194436722e-09, "loss": 1.1024, "step": 32702 }, { "epoch": 0.99, "learning_rate": 2.8798627975340498e-09, "loss": 1.1747, "step": 32703 }, { "epoch": 0.99, "learning_rate": 2.8681701720123523e-09, "loss": 1.123, "step": 32704 }, { "epoch": 0.99, "learning_rate": 2.8565013179829295e-09, "loss": 1.0046, "step": 32705 }, { "epoch": 0.99, "learning_rate": 2.8448562355568033e-09, "loss": 1.1218, "step": 32706 }, { "epoch": 0.99, "learning_rate": 2.833234924845274e-09, "loss": 0.9737, "step": 32707 }, { "epoch": 0.99, "learning_rate": 2.821637385958531e-09, "loss": 1.1271, "step": 32708 }, { "epoch": 0.99, "learning_rate": 2.8100636190070418e-09, "loss": 0.98, "step": 32709 }, { "epoch": 0.99, "learning_rate": 2.7985136241012732e-09, "loss": 1.0897, "step": 32710 }, { "epoch": 0.99, "learning_rate": 2.7869874013505826e-09, "loss": 1.1155, "step": 32711 }, { "epoch": 0.99, "learning_rate": 2.775484950865437e-09, "loss": 1.1077, "step": 32712 }, { "epoch": 0.99, "learning_rate": 2.7640062727549155e-09, "loss": 1.0744, "step": 32713 }, { "epoch": 0.99, "learning_rate": 2.752551367128098e-09, "loss": 1.0507, "step": 32714 }, { "epoch": 0.99, "learning_rate": 2.7411202340946186e-09, "loss": 1.0537, "step": 32715 }, { "epoch": 0.99, "learning_rate": 2.7297128737627245e-09, "loss": 0.9501, "step": 32716 }, { "epoch": 0.99, "learning_rate": 2.718329286241217e-09, "loss": 1.2564, "step": 32717 }, { "epoch": 0.99, "learning_rate": 2.706969471638621e-09, "loss": 1.1821, "step": 32718 }, { "epoch": 0.99, "learning_rate": 2.695633430062905e-09, "loss": 1.1156, "step": 32719 }, { "epoch": 0.99, "learning_rate": 2.6843211616220386e-09, "loss": 1.1915, "step": 32720 }, { "epoch": 0.99, "learning_rate": 2.6730326664234364e-09, "loss": 1.0839, "step": 32721 }, { "epoch": 0.99, "learning_rate": 2.6617679445750664e-09, "loss": 1.1377, "step": 32722 }, { "epoch": 0.99, "learning_rate": 2.6505269961840663e-09, "loss": 1.1266, "step": 32723 }, { "epoch": 0.99, "learning_rate": 2.6393098213570168e-09, "loss": 1.1127, "step": 32724 }, { "epoch": 0.99, "learning_rate": 2.6281164202010545e-09, "loss": 1.0921, "step": 32725 }, { "epoch": 0.99, "learning_rate": 2.6169467928224835e-09, "loss": 1.0608, "step": 32726 }, { "epoch": 0.99, "learning_rate": 2.605800939327885e-09, "loss": 1.0396, "step": 32727 }, { "epoch": 0.99, "learning_rate": 2.5946788598235627e-09, "loss": 1.0038, "step": 32728 }, { "epoch": 0.99, "learning_rate": 2.583580554414711e-09, "loss": 1.1472, "step": 32729 }, { "epoch": 0.99, "learning_rate": 2.5725060232076326e-09, "loss": 1.1957, "step": 32730 }, { "epoch": 0.99, "learning_rate": 2.5614552663072447e-09, "loss": 1.1996, "step": 32731 }, { "epoch": 0.99, "learning_rate": 2.550428283819295e-09, "loss": 1.1118, "step": 32732 }, { "epoch": 0.99, "learning_rate": 2.5394250758481454e-09, "loss": 1.1401, "step": 32733 }, { "epoch": 0.99, "learning_rate": 2.528445642498989e-09, "loss": 1.1232, "step": 32734 }, { "epoch": 0.99, "learning_rate": 2.5174899838764646e-09, "loss": 1.0806, "step": 32735 }, { "epoch": 0.99, "learning_rate": 2.5065581000840998e-09, "loss": 1.1951, "step": 32736 }, { "epoch": 0.99, "learning_rate": 2.4956499912268117e-09, "loss": 1.1475, "step": 32737 }, { "epoch": 0.99, "learning_rate": 2.484765657408128e-09, "loss": 1.1766, "step": 32738 }, { "epoch": 0.99, "learning_rate": 2.473905098731577e-09, "loss": 1.0806, "step": 32739 }, { "epoch": 0.99, "learning_rate": 2.46306831530041e-09, "loss": 0.9979, "step": 32740 }, { "epoch": 0.99, "learning_rate": 2.4522553072181543e-09, "loss": 1.1201, "step": 32741 }, { "epoch": 0.99, "learning_rate": 2.4414660745875064e-09, "loss": 1.0072, "step": 32742 }, { "epoch": 0.99, "learning_rate": 2.4307006175111614e-09, "loss": 1.2632, "step": 32743 }, { "epoch": 0.99, "learning_rate": 2.419958936091815e-09, "loss": 1.0059, "step": 32744 }, { "epoch": 0.99, "learning_rate": 2.4092410304316085e-09, "loss": 1.1726, "step": 32745 }, { "epoch": 0.99, "learning_rate": 2.3985469006324036e-09, "loss": 1.0747, "step": 32746 }, { "epoch": 0.99, "learning_rate": 2.3878765467963414e-09, "loss": 1.0398, "step": 32747 }, { "epoch": 0.99, "learning_rate": 2.3772299690247302e-09, "loss": 1.1367, "step": 32748 }, { "epoch": 0.99, "learning_rate": 2.366607167418877e-09, "loss": 1.1457, "step": 32749 }, { "epoch": 0.99, "learning_rate": 2.356008142080091e-09, "loss": 1.0748, "step": 32750 }, { "epoch": 0.99, "learning_rate": 2.345432893109123e-09, "loss": 1.0067, "step": 32751 }, { "epoch": 0.99, "learning_rate": 2.3348814206067273e-09, "loss": 1.0923, "step": 32752 }, { "epoch": 0.99, "learning_rate": 2.3243537246733783e-09, "loss": 1.0444, "step": 32753 }, { "epoch": 0.99, "learning_rate": 2.3138498054092738e-09, "loss": 1.1155, "step": 32754 }, { "epoch": 0.99, "learning_rate": 2.3033696629146116e-09, "loss": 1.223, "step": 32755 }, { "epoch": 0.99, "learning_rate": 2.292913297288757e-09, "loss": 1.2086, "step": 32756 }, { "epoch": 0.99, "learning_rate": 2.2824807086313517e-09, "loss": 0.9819, "step": 32757 }, { "epoch": 0.99, "learning_rate": 2.272071897041761e-09, "loss": 1.0792, "step": 32758 }, { "epoch": 0.99, "learning_rate": 2.26168686261935e-09, "loss": 1.0242, "step": 32759 }, { "epoch": 0.99, "learning_rate": 2.2513256054623734e-09, "loss": 0.9921, "step": 32760 }, { "epoch": 0.99, "learning_rate": 2.240988125670196e-09, "loss": 1.0677, "step": 32761 }, { "epoch": 0.99, "learning_rate": 2.2306744233405176e-09, "loss": 1.1472, "step": 32762 }, { "epoch": 0.99, "learning_rate": 2.220384498572148e-09, "loss": 1.065, "step": 32763 }, { "epoch": 0.99, "learning_rate": 2.210118351462509e-09, "loss": 1.0328, "step": 32764 }, { "epoch": 0.99, "learning_rate": 2.199875982109856e-09, "loss": 1.2087, "step": 32765 }, { "epoch": 0.99, "learning_rate": 2.189657390611055e-09, "loss": 1.0804, "step": 32766 }, { "epoch": 0.99, "learning_rate": 2.1794625770638068e-09, "loss": 1.0328, "step": 32767 }, { "epoch": 0.99, "learning_rate": 2.1692915415652547e-09, "loss": 1.0096, "step": 32768 }, { "epoch": 0.99, "learning_rate": 2.1591442842119893e-09, "loss": 1.0526, "step": 32769 }, { "epoch": 0.99, "learning_rate": 2.149020805100599e-09, "loss": 1.1413, "step": 32770 }, { "epoch": 0.99, "learning_rate": 2.138921104327396e-09, "loss": 1.1548, "step": 32771 }, { "epoch": 0.99, "learning_rate": 2.12884518198897e-09, "loss": 1.0594, "step": 32772 }, { "epoch": 0.99, "learning_rate": 2.1187930381807996e-09, "loss": 1.0617, "step": 32773 }, { "epoch": 0.99, "learning_rate": 2.108764672998642e-09, "loss": 1.1303, "step": 32774 }, { "epoch": 0.99, "learning_rate": 2.0987600865379767e-09, "loss": 1.2361, "step": 32775 }, { "epoch": 0.99, "learning_rate": 2.088779278894004e-09, "loss": 0.9827, "step": 32776 }, { "epoch": 0.99, "learning_rate": 2.078822250161927e-09, "loss": 1.1492, "step": 32777 }, { "epoch": 0.99, "learning_rate": 2.068889000436669e-09, "loss": 1.089, "step": 32778 }, { "epoch": 0.99, "learning_rate": 2.0589795298123214e-09, "loss": 1.1031, "step": 32779 }, { "epoch": 0.99, "learning_rate": 2.0490938383832537e-09, "loss": 1.0451, "step": 32780 }, { "epoch": 0.99, "learning_rate": 2.039231926244112e-09, "loss": 0.9561, "step": 32781 }, { "epoch": 0.99, "learning_rate": 2.0293937934881548e-09, "loss": 1.0874, "step": 32782 }, { "epoch": 0.99, "learning_rate": 2.0195794402094737e-09, "loss": 1.0676, "step": 32783 }, { "epoch": 0.99, "learning_rate": 2.0097888665013276e-09, "loss": 1.1261, "step": 32784 }, { "epoch": 0.99, "learning_rate": 2.0000220724566977e-09, "loss": 1.0959, "step": 32785 }, { "epoch": 0.99, "learning_rate": 1.99027905816912e-09, "loss": 1.0768, "step": 32786 }, { "epoch": 0.99, "learning_rate": 1.9805598237307434e-09, "loss": 1.0234, "step": 32787 }, { "epoch": 0.99, "learning_rate": 1.9708643692345488e-09, "loss": 1.0037, "step": 32788 }, { "epoch": 0.99, "learning_rate": 1.961192694772407e-09, "loss": 1.0569, "step": 32789 }, { "epoch": 0.99, "learning_rate": 1.9515448004367443e-09, "loss": 1.0892, "step": 32790 }, { "epoch": 0.99, "learning_rate": 1.941920686319154e-09, "loss": 1.113, "step": 32791 }, { "epoch": 0.99, "learning_rate": 1.9323203525115076e-09, "loss": 1.0422, "step": 32792 }, { "epoch": 0.99, "learning_rate": 1.92274379910512e-09, "loss": 1.261, "step": 32793 }, { "epoch": 0.99, "learning_rate": 1.91319102619103e-09, "loss": 0.9921, "step": 32794 }, { "epoch": 0.99, "learning_rate": 1.9036620338602763e-09, "loss": 1.0803, "step": 32795 }, { "epoch": 0.99, "learning_rate": 1.8941568222033415e-09, "loss": 1.1416, "step": 32796 }, { "epoch": 0.99, "learning_rate": 1.8846753913109862e-09, "loss": 1.1434, "step": 32797 }, { "epoch": 0.99, "learning_rate": 1.8752177412734164e-09, "loss": 1.1588, "step": 32798 }, { "epoch": 0.99, "learning_rate": 1.86578387218056e-09, "loss": 1.0052, "step": 32799 }, { "epoch": 0.99, "learning_rate": 1.8563737841226226e-09, "loss": 1.0939, "step": 32800 }, { "epoch": 0.99, "learning_rate": 1.8469874771884222e-09, "loss": 1.0578, "step": 32801 }, { "epoch": 0.99, "learning_rate": 1.8376249514681644e-09, "loss": 1.0856, "step": 32802 }, { "epoch": 0.99, "learning_rate": 1.8282862070501118e-09, "loss": 1.0179, "step": 32803 }, { "epoch": 0.99, "learning_rate": 1.818971244023915e-09, "loss": 1.0359, "step": 32804 }, { "epoch": 0.99, "learning_rate": 1.8096800624778366e-09, "loss": 1.0449, "step": 32805 }, { "epoch": 0.99, "learning_rate": 1.8004126625006946e-09, "loss": 1.1094, "step": 32806 }, { "epoch": 0.99, "learning_rate": 1.7911690441801965e-09, "loss": 1.1449, "step": 32807 }, { "epoch": 0.99, "learning_rate": 1.7819492076046051e-09, "loss": 1.1735, "step": 32808 }, { "epoch": 0.99, "learning_rate": 1.772753152861628e-09, "loss": 1.0289, "step": 32809 }, { "epoch": 0.99, "learning_rate": 1.763580880038973e-09, "loss": 1.1125, "step": 32810 }, { "epoch": 0.99, "learning_rate": 1.7544323892237925e-09, "loss": 1.0915, "step": 32811 }, { "epoch": 0.99, "learning_rate": 1.7453076805032387e-09, "loss": 1.0774, "step": 32812 }, { "epoch": 0.99, "learning_rate": 1.736206753964187e-09, "loss": 1.0709, "step": 32813 }, { "epoch": 0.99, "learning_rate": 1.7271296096932344e-09, "loss": 1.0799, "step": 32814 }, { "epoch": 0.99, "learning_rate": 1.718076247776701e-09, "loss": 1.1234, "step": 32815 }, { "epoch": 0.99, "learning_rate": 1.7090466683009066e-09, "loss": 1.0687, "step": 32816 }, { "epoch": 0.99, "learning_rate": 1.7000408713516158e-09, "loss": 1.0125, "step": 32817 }, { "epoch": 0.99, "learning_rate": 1.691058857014871e-09, "loss": 1.0692, "step": 32818 }, { "epoch": 0.99, "learning_rate": 1.6821006253761596e-09, "loss": 1.1587, "step": 32819 }, { "epoch": 0.99, "learning_rate": 1.6731661765204133e-09, "loss": 1.1519, "step": 32820 }, { "epoch": 0.99, "learning_rate": 1.6642555105331192e-09, "loss": 0.986, "step": 32821 }, { "epoch": 0.99, "learning_rate": 1.6553686274986548e-09, "loss": 1.0167, "step": 32822 }, { "epoch": 0.99, "learning_rate": 1.6465055275019514e-09, "loss": 1.1545, "step": 32823 }, { "epoch": 0.99, "learning_rate": 1.637666210627109e-09, "loss": 1.2226, "step": 32824 }, { "epoch": 0.99, "learning_rate": 1.6288506769585044e-09, "loss": 1.0765, "step": 32825 }, { "epoch": 0.99, "learning_rate": 1.6200589265799594e-09, "loss": 1.1653, "step": 32826 }, { "epoch": 0.99, "learning_rate": 1.6112909595752958e-09, "loss": 1.1585, "step": 32827 }, { "epoch": 0.99, "learning_rate": 1.6025467760277802e-09, "loss": 1.1305, "step": 32828 }, { "epoch": 0.99, "learning_rate": 1.5938263760209571e-09, "loss": 1.0206, "step": 32829 }, { "epoch": 0.99, "learning_rate": 1.5851297596372605e-09, "loss": 0.9833, "step": 32830 }, { "epoch": 0.99, "learning_rate": 1.5764569269602348e-09, "loss": 1.0361, "step": 32831 }, { "epoch": 0.99, "learning_rate": 1.5678078780717587e-09, "loss": 1.0941, "step": 32832 }, { "epoch": 0.99, "learning_rate": 1.559182613054544e-09, "loss": 1.1262, "step": 32833 }, { "epoch": 0.99, "learning_rate": 1.5505811319907471e-09, "loss": 1.163, "step": 32834 }, { "epoch": 0.99, "learning_rate": 1.542003434962247e-09, "loss": 1.0958, "step": 32835 }, { "epoch": 0.99, "learning_rate": 1.5334495220503676e-09, "loss": 0.9916, "step": 32836 }, { "epoch": 0.99, "learning_rate": 1.5249193933367102e-09, "loss": 1.1051, "step": 32837 }, { "epoch": 0.99, "learning_rate": 1.5164130489025986e-09, "loss": 1.019, "step": 32838 }, { "epoch": 0.99, "learning_rate": 1.5079304888288015e-09, "loss": 1.1089, "step": 32839 }, { "epoch": 0.99, "learning_rate": 1.4994717131963654e-09, "loss": 1.0121, "step": 32840 }, { "epoch": 0.99, "learning_rate": 1.4910367220855038e-09, "loss": 1.113, "step": 32841 }, { "epoch": 0.99, "learning_rate": 1.4826255155767077e-09, "loss": 1.1696, "step": 32842 }, { "epoch": 0.99, "learning_rate": 1.4742380937499135e-09, "loss": 1.0948, "step": 32843 }, { "epoch": 0.99, "learning_rate": 1.465874456685057e-09, "loss": 1.1561, "step": 32844 }, { "epoch": 0.99, "learning_rate": 1.4575346044617966e-09, "loss": 1.1322, "step": 32845 }, { "epoch": 0.99, "learning_rate": 1.4492185371595135e-09, "loss": 0.9749, "step": 32846 }, { "epoch": 0.99, "learning_rate": 1.440926254857311e-09, "loss": 0.9479, "step": 32847 }, { "epoch": 0.99, "learning_rate": 1.4326577576340151e-09, "loss": 1.0287, "step": 32848 }, { "epoch": 0.99, "learning_rate": 1.4244130455684512e-09, "loss": 1.0435, "step": 32849 }, { "epoch": 0.99, "learning_rate": 1.416192118739168e-09, "loss": 1.0645, "step": 32850 }, { "epoch": 0.99, "learning_rate": 1.407994977224436e-09, "loss": 1.0635, "step": 32851 }, { "epoch": 0.99, "learning_rate": 1.3998216211022486e-09, "loss": 1.0594, "step": 32852 }, { "epoch": 0.99, "learning_rate": 1.391672050450321e-09, "loss": 1.0491, "step": 32853 }, { "epoch": 0.99, "learning_rate": 1.3835462653463693e-09, "loss": 1.0195, "step": 32854 }, { "epoch": 0.99, "learning_rate": 1.3754442658678314e-09, "loss": 1.1389, "step": 32855 }, { "epoch": 0.99, "learning_rate": 1.3673660520915899e-09, "loss": 1.1413, "step": 32856 }, { "epoch": 0.99, "learning_rate": 1.359311624094528e-09, "loss": 1.0491, "step": 32857 }, { "epoch": 0.99, "learning_rate": 1.3512809819532513e-09, "loss": 1.0213, "step": 32858 }, { "epoch": 0.99, "learning_rate": 1.3432741257446424e-09, "loss": 1.0526, "step": 32859 }, { "epoch": 0.99, "learning_rate": 1.3352910555447519e-09, "loss": 1.0887, "step": 32860 }, { "epoch": 0.99, "learning_rate": 1.327331771429352e-09, "loss": 1.0437, "step": 32861 }, { "epoch": 0.99, "learning_rate": 1.3193962734744935e-09, "loss": 1.2697, "step": 32862 }, { "epoch": 0.99, "learning_rate": 1.311484561755394e-09, "loss": 1.1853, "step": 32863 }, { "epoch": 0.99, "learning_rate": 1.3035966363475483e-09, "loss": 1.0664, "step": 32864 }, { "epoch": 0.99, "learning_rate": 1.2957324973261742e-09, "loss": 1.0668, "step": 32865 }, { "epoch": 0.99, "learning_rate": 1.2878921447659343e-09, "loss": 1.0996, "step": 32866 }, { "epoch": 0.99, "learning_rate": 1.280075578741491e-09, "loss": 1.048, "step": 32867 }, { "epoch": 0.99, "learning_rate": 1.2722827993275066e-09, "loss": 1.1638, "step": 32868 }, { "epoch": 0.99, "learning_rate": 1.2645138065978113e-09, "loss": 0.9456, "step": 32869 }, { "epoch": 0.99, "learning_rate": 1.2567686006265123e-09, "loss": 1.1543, "step": 32870 }, { "epoch": 0.99, "learning_rate": 1.2490471814874395e-09, "loss": 1.1736, "step": 32871 }, { "epoch": 0.99, "learning_rate": 1.2413495492538675e-09, "loss": 1.0098, "step": 32872 }, { "epoch": 0.99, "learning_rate": 1.233675703999071e-09, "loss": 1.0602, "step": 32873 }, { "epoch": 0.99, "learning_rate": 1.2260256457966025e-09, "loss": 1.1417, "step": 32874 }, { "epoch": 0.99, "learning_rate": 1.2183993747186263e-09, "loss": 1.2054, "step": 32875 }, { "epoch": 0.99, "learning_rate": 1.2107968908381395e-09, "loss": 1.1113, "step": 32876 }, { "epoch": 0.99, "learning_rate": 1.2032181942273068e-09, "loss": 1.1285, "step": 32877 }, { "epoch": 0.99, "learning_rate": 1.1956632849585703e-09, "loss": 1.0187, "step": 32878 }, { "epoch": 0.99, "learning_rate": 1.1881321631035393e-09, "loss": 1.1263, "step": 32879 }, { "epoch": 0.99, "learning_rate": 1.1806248287341004e-09, "loss": 0.9998, "step": 32880 }, { "epoch": 0.99, "learning_rate": 1.173141281921586e-09, "loss": 1.1085, "step": 32881 }, { "epoch": 0.99, "learning_rate": 1.1656815227373276e-09, "loss": 1.0099, "step": 32882 }, { "epoch": 0.99, "learning_rate": 1.1582455512521019e-09, "loss": 1.0617, "step": 32883 }, { "epoch": 0.99, "learning_rate": 1.1508333675372407e-09, "loss": 1.0092, "step": 32884 }, { "epoch": 0.99, "learning_rate": 1.1434449716626884e-09, "loss": 1.0851, "step": 32885 }, { "epoch": 0.99, "learning_rate": 1.1360803636992212e-09, "loss": 1.171, "step": 32886 }, { "epoch": 0.99, "learning_rate": 1.1287395437165061e-09, "loss": 1.1313, "step": 32887 }, { "epoch": 0.99, "learning_rate": 1.121422511785042e-09, "loss": 0.9343, "step": 32888 }, { "epoch": 0.99, "learning_rate": 1.1141292679739402e-09, "loss": 1.1863, "step": 32889 }, { "epoch": 0.99, "learning_rate": 1.1068598123528673e-09, "loss": 1.0486, "step": 32890 }, { "epoch": 0.99, "learning_rate": 1.0996141449909348e-09, "loss": 1.0574, "step": 32891 }, { "epoch": 0.99, "learning_rate": 1.0923922659569763e-09, "loss": 1.2819, "step": 32892 }, { "epoch": 0.99, "learning_rate": 1.085194175320381e-09, "loss": 1.0824, "step": 32893 }, { "epoch": 0.99, "learning_rate": 1.0780198731488723e-09, "loss": 1.0333, "step": 32894 }, { "epoch": 0.99, "learning_rate": 1.070869359511284e-09, "loss": 0.9579, "step": 32895 }, { "epoch": 0.99, "learning_rate": 1.06374263447534e-09, "loss": 1.0368, "step": 32896 }, { "epoch": 0.99, "learning_rate": 1.056639698109041e-09, "loss": 0.9908, "step": 32897 }, { "epoch": 0.99, "learning_rate": 1.049560550480111e-09, "loss": 1.0493, "step": 32898 }, { "epoch": 0.99, "learning_rate": 1.0425051916557182e-09, "loss": 1.0934, "step": 32899 }, { "epoch": 0.99, "learning_rate": 1.035473621703309e-09, "loss": 1.0508, "step": 32900 }, { "epoch": 0.99, "learning_rate": 1.0284658406894965e-09, "loss": 1.1174, "step": 32901 }, { "epoch": 0.99, "learning_rate": 1.0214818486811718e-09, "loss": 1.0583, "step": 32902 }, { "epoch": 0.99, "learning_rate": 1.0145216457446705e-09, "loss": 1.0852, "step": 32903 }, { "epoch": 0.99, "learning_rate": 1.007585231946606e-09, "loss": 1.109, "step": 32904 }, { "epoch": 0.99, "learning_rate": 1.0006726073527595e-09, "loss": 1.1584, "step": 32905 }, { "epoch": 0.99, "learning_rate": 9.937837720289112e-10, "loss": 1.1946, "step": 32906 }, { "epoch": 0.99, "learning_rate": 9.869187260405644e-10, "loss": 1.1096, "step": 32907 }, { "epoch": 0.99, "learning_rate": 9.800774694532223e-10, "loss": 1.0681, "step": 32908 }, { "epoch": 0.99, "learning_rate": 9.732600023321104e-10, "loss": 1.0684, "step": 32909 }, { "epoch": 0.99, "learning_rate": 9.664663247416218e-10, "loss": 1.1252, "step": 32910 }, { "epoch": 0.99, "learning_rate": 9.596964367472594e-10, "loss": 1.1495, "step": 32911 }, { "epoch": 0.99, "learning_rate": 9.529503384128612e-10, "loss": 1.0907, "step": 32912 }, { "epoch": 0.99, "learning_rate": 9.462280298025427e-10, "loss": 1.0656, "step": 32913 }, { "epoch": 0.99, "learning_rate": 9.395295109806967e-10, "loss": 1.0991, "step": 32914 }, { "epoch": 0.99, "learning_rate": 9.328547820111612e-10, "loss": 1.0484, "step": 32915 }, { "epoch": 0.99, "learning_rate": 9.262038429569408e-10, "loss": 1.0553, "step": 32916 }, { "epoch": 0.99, "learning_rate": 9.19576693881874e-10, "loss": 1.1709, "step": 32917 }, { "epoch": 0.99, "learning_rate": 9.12973334848688e-10, "loss": 1.035, "step": 32918 }, { "epoch": 0.99, "learning_rate": 9.063937659206656e-10, "loss": 1.1105, "step": 32919 }, { "epoch": 0.99, "learning_rate": 8.998379871599794e-10, "loss": 1.0562, "step": 32920 }, { "epoch": 0.99, "learning_rate": 8.933059986290793e-10, "loss": 1.0479, "step": 32921 }, { "epoch": 0.99, "learning_rate": 8.867978003906929e-10, "loss": 1.0377, "step": 32922 }, { "epoch": 0.99, "learning_rate": 8.803133925058827e-10, "loss": 1.2173, "step": 32923 }, { "epoch": 0.99, "learning_rate": 8.738527750370984e-10, "loss": 1.231, "step": 32924 }, { "epoch": 0.99, "learning_rate": 8.674159480456801e-10, "loss": 1.2141, "step": 32925 }, { "epoch": 0.99, "learning_rate": 8.610029115929674e-10, "loss": 1.1369, "step": 32926 }, { "epoch": 0.99, "learning_rate": 8.546136657397452e-10, "loss": 1.0313, "step": 32927 }, { "epoch": 0.99, "learning_rate": 8.482482105467982e-10, "loss": 1.0765, "step": 32928 }, { "epoch": 0.99, "learning_rate": 8.419065460751885e-10, "loss": 1.0853, "step": 32929 }, { "epoch": 0.99, "learning_rate": 8.355886723845908e-10, "loss": 1.1735, "step": 32930 }, { "epoch": 0.99, "learning_rate": 8.292945895357896e-10, "loss": 1.0782, "step": 32931 }, { "epoch": 0.99, "learning_rate": 8.230242975884595e-10, "loss": 1.0622, "step": 32932 }, { "epoch": 0.99, "learning_rate": 8.167777966025525e-10, "loss": 1.1707, "step": 32933 }, { "epoch": 0.99, "learning_rate": 8.105550866369105e-10, "loss": 1.0694, "step": 32934 }, { "epoch": 0.99, "learning_rate": 8.04356167751208e-10, "loss": 1.0637, "step": 32935 }, { "epoch": 0.99, "learning_rate": 7.981810400042867e-10, "loss": 1.0619, "step": 32936 }, { "epoch": 0.99, "learning_rate": 7.92029703455266e-10, "loss": 1.0787, "step": 32937 }, { "epoch": 0.99, "learning_rate": 7.859021581624327e-10, "loss": 1.08, "step": 32938 }, { "epoch": 0.99, "learning_rate": 7.797984041840733e-10, "loss": 1.1805, "step": 32939 }, { "epoch": 0.99, "learning_rate": 7.737184415781973e-10, "loss": 1.0162, "step": 32940 }, { "epoch": 0.99, "learning_rate": 7.676622704030912e-10, "loss": 1.104, "step": 32941 }, { "epoch": 0.99, "learning_rate": 7.61629890716209e-10, "loss": 1.1526, "step": 32942 }, { "epoch": 0.99, "learning_rate": 7.556213025747272e-10, "loss": 1.2235, "step": 32943 }, { "epoch": 0.99, "learning_rate": 7.496365060360999e-10, "loss": 1.1776, "step": 32944 }, { "epoch": 0.99, "learning_rate": 7.436755011572261e-10, "loss": 1.0201, "step": 32945 }, { "epoch": 0.99, "learning_rate": 7.377382879950046e-10, "loss": 1.0609, "step": 32946 }, { "epoch": 0.99, "learning_rate": 7.318248666057793e-10, "loss": 1.1028, "step": 32947 }, { "epoch": 0.99, "learning_rate": 7.259352370458939e-10, "loss": 1.1349, "step": 32948 }, { "epoch": 0.99, "learning_rate": 7.200693993714147e-10, "loss": 1.2382, "step": 32949 }, { "epoch": 0.99, "learning_rate": 7.142273536381306e-10, "loss": 1.1058, "step": 32950 }, { "epoch": 0.99, "learning_rate": 7.084090999018301e-10, "loss": 1.1109, "step": 32951 }, { "epoch": 0.99, "learning_rate": 7.026146382177467e-10, "loss": 1.121, "step": 32952 }, { "epoch": 0.99, "learning_rate": 6.968439686411144e-10, "loss": 1.0289, "step": 32953 }, { "epoch": 0.99, "learning_rate": 6.910970912266113e-10, "loss": 1.0922, "step": 32954 }, { "epoch": 0.99, "learning_rate": 6.853740060291936e-10, "loss": 1.0816, "step": 32955 }, { "epoch": 0.99, "learning_rate": 6.796747131035398e-10, "loss": 1.1216, "step": 32956 }, { "epoch": 0.99, "learning_rate": 6.739992125034956e-10, "loss": 1.1234, "step": 32957 }, { "epoch": 0.99, "learning_rate": 6.683475042831844e-10, "loss": 1.0356, "step": 32958 }, { "epoch": 0.99, "learning_rate": 6.627195884967297e-10, "loss": 1.0616, "step": 32959 }, { "epoch": 0.99, "learning_rate": 6.571154651971445e-10, "loss": 1.1823, "step": 32960 }, { "epoch": 0.99, "learning_rate": 6.515351344382747e-10, "loss": 1.2091, "step": 32961 }, { "epoch": 0.99, "learning_rate": 6.459785962731336e-10, "loss": 1.1525, "step": 32962 }, { "epoch": 0.99, "learning_rate": 6.404458507544565e-10, "loss": 1.0505, "step": 32963 }, { "epoch": 0.99, "learning_rate": 6.34936897934979e-10, "loss": 1.0203, "step": 32964 }, { "epoch": 0.99, "learning_rate": 6.294517378671594e-10, "loss": 0.9507, "step": 32965 }, { "epoch": 0.99, "learning_rate": 6.239903706031781e-10, "loss": 1.0104, "step": 32966 }, { "epoch": 0.99, "learning_rate": 6.185527961952153e-10, "loss": 1.1522, "step": 32967 }, { "epoch": 0.99, "learning_rate": 6.131390146948968e-10, "loss": 1.2462, "step": 32968 }, { "epoch": 0.99, "learning_rate": 6.077490261535702e-10, "loss": 1.1328, "step": 32969 }, { "epoch": 0.99, "learning_rate": 6.023828306228607e-10, "loss": 1.0892, "step": 32970 }, { "epoch": 0.99, "learning_rate": 5.970404281535613e-10, "loss": 1.0588, "step": 32971 }, { "epoch": 0.99, "learning_rate": 5.917218187967422e-10, "loss": 1.1003, "step": 32972 }, { "epoch": 0.99, "learning_rate": 5.86427002603196e-10, "loss": 1.162, "step": 32973 }, { "epoch": 0.99, "learning_rate": 5.811559796228827e-10, "loss": 1.1757, "step": 32974 }, { "epoch": 0.99, "learning_rate": 5.759087499063176e-10, "loss": 1.0225, "step": 32975 }, { "epoch": 0.99, "learning_rate": 5.706853135031831e-10, "loss": 1.1467, "step": 32976 }, { "epoch": 0.99, "learning_rate": 5.654856704634392e-10, "loss": 1.065, "step": 32977 }, { "epoch": 0.99, "learning_rate": 5.60309820836491e-10, "loss": 1.0529, "step": 32978 }, { "epoch": 0.99, "learning_rate": 5.551577646717432e-10, "loss": 1.0012, "step": 32979 }, { "epoch": 0.99, "learning_rate": 5.500295020180457e-10, "loss": 0.9911, "step": 32980 }, { "epoch": 0.99, "learning_rate": 5.449250329242484e-10, "loss": 1.1876, "step": 32981 }, { "epoch": 0.99, "learning_rate": 5.398443574389234e-10, "loss": 0.998, "step": 32982 }, { "epoch": 0.99, "learning_rate": 5.34787475610643e-10, "loss": 1.0225, "step": 32983 }, { "epoch": 0.99, "learning_rate": 5.297543874874245e-10, "loss": 1.1251, "step": 32984 }, { "epoch": 0.99, "learning_rate": 5.247450931170072e-10, "loss": 1.0544, "step": 32985 }, { "epoch": 0.99, "learning_rate": 5.197595925474086e-10, "loss": 1.1492, "step": 32986 }, { "epoch": 0.99, "learning_rate": 5.147978858258129e-10, "loss": 1.0798, "step": 32987 }, { "epoch": 0.99, "learning_rate": 5.098599729994047e-10, "loss": 1.084, "step": 32988 }, { "epoch": 0.99, "learning_rate": 5.049458541153684e-10, "loss": 1.0396, "step": 32989 }, { "epoch": 0.99, "learning_rate": 5.000555292206111e-10, "loss": 1.1268, "step": 32990 }, { "epoch": 0.99, "learning_rate": 4.951889983614844e-10, "loss": 1.1436, "step": 32991 }, { "epoch": 0.99, "learning_rate": 4.903462615843401e-10, "loss": 1.1479, "step": 32992 }, { "epoch": 0.99, "learning_rate": 4.855273189352527e-10, "loss": 1.1349, "step": 32993 }, { "epoch": 0.99, "learning_rate": 4.807321704602963e-10, "loss": 1.0587, "step": 32994 }, { "epoch": 0.99, "learning_rate": 4.759608162047125e-10, "loss": 1.118, "step": 32995 }, { "epoch": 0.99, "learning_rate": 4.712132562142979e-10, "loss": 1.1384, "step": 32996 }, { "epoch": 0.99, "learning_rate": 4.664894905340168e-10, "loss": 1.0479, "step": 32997 }, { "epoch": 0.99, "learning_rate": 4.6178951920911043e-10, "loss": 1.2314, "step": 32998 }, { "epoch": 0.99, "learning_rate": 4.5711334228398797e-10, "loss": 1.1695, "step": 32999 }, { "epoch": 0.99, "learning_rate": 4.5246095980361336e-10, "loss": 1.0592, "step": 33000 }, { "epoch": 0.99, "learning_rate": 4.478323718115629e-10, "loss": 1.2285, "step": 33001 }, { "epoch": 0.99, "learning_rate": 4.4322757835252304e-10, "loss": 1.0247, "step": 33002 }, { "epoch": 0.99, "learning_rate": 4.386465794703476e-10, "loss": 1.1958, "step": 33003 }, { "epoch": 0.99, "learning_rate": 4.340893752080577e-10, "loss": 1.056, "step": 33004 }, { "epoch": 0.99, "learning_rate": 4.2955596560978476e-10, "loss": 1.1659, "step": 33005 }, { "epoch": 0.99, "learning_rate": 4.250463507179947e-10, "loss": 1.2729, "step": 33006 }, { "epoch": 0.99, "learning_rate": 4.2056053057598636e-10, "loss": 1.1271, "step": 33007 }, { "epoch": 0.99, "learning_rate": 4.160985052265032e-10, "loss": 1.0479, "step": 33008 }, { "epoch": 0.99, "learning_rate": 4.1166027471173375e-10, "loss": 0.9899, "step": 33009 }, { "epoch": 0.99, "learning_rate": 4.072458390744216e-10, "loss": 1.1198, "step": 33010 }, { "epoch": 0.99, "learning_rate": 4.0285519835592256e-10, "loss": 1.0875, "step": 33011 }, { "epoch": 0.99, "learning_rate": 3.9848835259870264e-10, "loss": 1.2603, "step": 33012 }, { "epoch": 0.99, "learning_rate": 3.9414530184384016e-10, "loss": 1.0491, "step": 33013 }, { "epoch": 0.99, "learning_rate": 3.898260461329684e-10, "loss": 1.0337, "step": 33014 }, { "epoch": 0.99, "learning_rate": 3.8553058550688804e-10, "loss": 1.1464, "step": 33015 }, { "epoch": 0.99, "learning_rate": 3.8125892000695497e-10, "loss": 1.0603, "step": 33016 }, { "epoch": 0.99, "learning_rate": 3.770110496734147e-10, "loss": 1.0554, "step": 33017 }, { "epoch": 0.99, "learning_rate": 3.7278697454706803e-10, "loss": 1.2672, "step": 33018 }, { "epoch": 0.99, "learning_rate": 3.685866946678829e-10, "loss": 1.0544, "step": 33019 }, { "epoch": 0.99, "learning_rate": 3.6441021007582733e-10, "loss": 1.0002, "step": 33020 }, { "epoch": 0.99, "learning_rate": 3.6025752081059184e-10, "loss": 1.1223, "step": 33021 }, { "epoch": 0.99, "learning_rate": 3.561286269118669e-10, "loss": 1.118, "step": 33022 }, { "epoch": 0.99, "learning_rate": 3.5202352841906537e-10, "loss": 1.068, "step": 33023 }, { "epoch": 0.99, "learning_rate": 3.479422253710452e-10, "loss": 1.1216, "step": 33024 }, { "epoch": 0.99, "learning_rate": 3.43884717806664e-10, "loss": 1.0424, "step": 33025 }, { "epoch": 0.99, "learning_rate": 3.398510057647797e-10, "loss": 1.1321, "step": 33026 }, { "epoch": 0.99, "learning_rate": 3.35841089283695e-10, "loss": 1.1277, "step": 33027 }, { "epoch": 0.99, "learning_rate": 3.3185496840143496e-10, "loss": 1.1323, "step": 33028 }, { "epoch": 0.99, "learning_rate": 3.2789264315602477e-10, "loss": 1.1749, "step": 33029 }, { "epoch": 1.0, "learning_rate": 3.2395411358521203e-10, "loss": 1.243, "step": 33030 }, { "epoch": 1.0, "learning_rate": 3.2003937972618915e-10, "loss": 1.2122, "step": 33031 }, { "epoch": 1.0, "learning_rate": 3.161484416169813e-10, "loss": 1.0864, "step": 33032 }, { "epoch": 1.0, "learning_rate": 3.1228129929394834e-10, "loss": 1.0714, "step": 33033 }, { "epoch": 1.0, "learning_rate": 3.084379527940051e-10, "loss": 1.1368, "step": 33034 }, { "epoch": 1.0, "learning_rate": 3.0461840215378903e-10, "loss": 1.0422, "step": 33035 }, { "epoch": 1.0, "learning_rate": 3.008226474099374e-10, "loss": 0.9588, "step": 33036 }, { "epoch": 1.0, "learning_rate": 2.970506885982549e-10, "loss": 1.1442, "step": 33037 }, { "epoch": 1.0, "learning_rate": 2.9330252575482386e-10, "loss": 1.0621, "step": 33038 }, { "epoch": 1.0, "learning_rate": 2.8957815891517136e-10, "loss": 1.0429, "step": 33039 }, { "epoch": 1.0, "learning_rate": 2.858775881148246e-10, "loss": 0.9027, "step": 33040 }, { "epoch": 1.0, "learning_rate": 2.8220081338903306e-10, "loss": 1.1396, "step": 33041 }, { "epoch": 1.0, "learning_rate": 2.785478347727688e-10, "loss": 1.1773, "step": 33042 }, { "epoch": 1.0, "learning_rate": 2.7491865230072636e-10, "loss": 1.1185, "step": 33043 }, { "epoch": 1.0, "learning_rate": 2.713132660078777e-10, "loss": 1.0284, "step": 33044 }, { "epoch": 1.0, "learning_rate": 2.67731675927807e-10, "loss": 1.1274, "step": 33045 }, { "epoch": 1.0, "learning_rate": 2.641738820952089e-10, "loss": 1.1525, "step": 33046 }, { "epoch": 1.0, "learning_rate": 2.606398845439451e-10, "loss": 1.0217, "step": 33047 }, { "epoch": 1.0, "learning_rate": 2.5712968330704466e-10, "loss": 1.2305, "step": 33048 }, { "epoch": 1.0, "learning_rate": 2.5364327841864713e-10, "loss": 1.15, "step": 33049 }, { "epoch": 1.0, "learning_rate": 2.501806699117815e-10, "loss": 1.2404, "step": 33050 }, { "epoch": 1.0, "learning_rate": 2.467418578189218e-10, "loss": 1.1283, "step": 33051 }, { "epoch": 1.0, "learning_rate": 2.433268421733748e-10, "loss": 1.0721, "step": 33052 }, { "epoch": 1.0, "learning_rate": 2.3993562300733685e-10, "loss": 0.9764, "step": 33053 }, { "epoch": 1.0, "learning_rate": 2.365682003532821e-10, "loss": 1.0529, "step": 33054 }, { "epoch": 1.0, "learning_rate": 2.332245742431294e-10, "loss": 1.031, "step": 33055 }, { "epoch": 1.0, "learning_rate": 2.2990474470879765e-10, "loss": 1.0429, "step": 33056 }, { "epoch": 1.0, "learning_rate": 2.2660871178192822e-10, "loss": 1.0901, "step": 33057 }, { "epoch": 1.0, "learning_rate": 2.2333647549360738e-10, "loss": 1.1597, "step": 33058 }, { "epoch": 1.0, "learning_rate": 2.2008803587519888e-10, "loss": 1.0881, "step": 33059 }, { "epoch": 1.0, "learning_rate": 2.1686339295778903e-10, "loss": 1.0688, "step": 33060 }, { "epoch": 1.0, "learning_rate": 2.1366254677163135e-10, "loss": 1.018, "step": 33061 }, { "epoch": 1.0, "learning_rate": 2.104854973478121e-10, "loss": 1.2083, "step": 33062 }, { "epoch": 1.0, "learning_rate": 2.0733224471602974e-10, "loss": 1.0297, "step": 33063 }, { "epoch": 1.0, "learning_rate": 2.0420278890653787e-10, "loss": 1.1017, "step": 33064 }, { "epoch": 1.0, "learning_rate": 2.0109712994903497e-10, "loss": 1.0924, "step": 33065 }, { "epoch": 1.0, "learning_rate": 1.9801526787321946e-10, "loss": 1.1724, "step": 33066 }, { "epoch": 1.0, "learning_rate": 1.949572027082347e-10, "loss": 1.1212, "step": 33067 }, { "epoch": 1.0, "learning_rate": 1.9192293448322407e-10, "loss": 1.1407, "step": 33068 }, { "epoch": 1.0, "learning_rate": 1.8891246322733092e-10, "loss": 1.104, "step": 33069 }, { "epoch": 1.0, "learning_rate": 1.859257889691435e-10, "loss": 1.1549, "step": 33070 }, { "epoch": 1.0, "learning_rate": 1.8296291173697244e-10, "loss": 1.097, "step": 33071 }, { "epoch": 1.0, "learning_rate": 1.8002383155885094e-10, "loss": 1.097, "step": 33072 }, { "epoch": 1.0, "learning_rate": 1.7710854846308966e-10, "loss": 1.0566, "step": 33073 }, { "epoch": 1.0, "learning_rate": 1.7421706247716662e-10, "loss": 0.9356, "step": 33074 }, { "epoch": 1.0, "learning_rate": 1.713493736288374e-10, "loss": 1.0332, "step": 33075 }, { "epoch": 1.0, "learning_rate": 1.6850548194530249e-10, "loss": 1.0674, "step": 33076 }, { "epoch": 1.0, "learning_rate": 1.6568538745376229e-10, "loss": 1.0486, "step": 33077 }, { "epoch": 1.0, "learning_rate": 1.6288909018058464e-10, "loss": 1.0601, "step": 33078 }, { "epoch": 1.0, "learning_rate": 1.6011659015297e-10, "loss": 1.1611, "step": 33079 }, { "epoch": 1.0, "learning_rate": 1.5736788739728613e-10, "loss": 0.9528, "step": 33080 }, { "epoch": 1.0, "learning_rate": 1.5464298193906825e-10, "loss": 1.2121, "step": 33081 }, { "epoch": 1.0, "learning_rate": 1.5194187380496162e-10, "loss": 1.058, "step": 33082 }, { "epoch": 1.0, "learning_rate": 1.492645630205014e-10, "loss": 1.1078, "step": 33083 }, { "epoch": 1.0, "learning_rate": 1.4661104961066764e-10, "loss": 1.0491, "step": 33084 }, { "epoch": 1.0, "learning_rate": 1.4398133360155052e-10, "loss": 1.0687, "step": 33085 }, { "epoch": 1.0, "learning_rate": 1.41375415017575e-10, "loss": 1.1108, "step": 33086 }, { "epoch": 1.0, "learning_rate": 1.387932938837211e-10, "loss": 1.0651, "step": 33087 }, { "epoch": 1.0, "learning_rate": 1.3623497022441368e-10, "loss": 1.1031, "step": 33088 }, { "epoch": 1.0, "learning_rate": 1.3370044406435523e-10, "loss": 1.0941, "step": 33089 }, { "epoch": 1.0, "learning_rate": 1.3118971542741553e-10, "loss": 1.1021, "step": 33090 }, { "epoch": 1.0, "learning_rate": 1.2870278433774196e-10, "loss": 1.1927, "step": 33091 }, { "epoch": 1.0, "learning_rate": 1.262396508186492e-10, "loss": 1.2183, "step": 33092 }, { "epoch": 1.0, "learning_rate": 1.2380031489400702e-10, "loss": 1.0851, "step": 33093 }, { "epoch": 1.0, "learning_rate": 1.2138477658657498e-10, "loss": 1.1129, "step": 33094 }, { "epoch": 1.0, "learning_rate": 1.1899303591966783e-10, "loss": 1.1331, "step": 33095 }, { "epoch": 1.0, "learning_rate": 1.1662509291604506e-10, "loss": 1.1087, "step": 33096 }, { "epoch": 1.0, "learning_rate": 1.142809475979112e-10, "loss": 1.0806, "step": 33097 }, { "epoch": 1.0, "learning_rate": 1.1196059998802578e-10, "loss": 1.1583, "step": 33098 }, { "epoch": 1.0, "learning_rate": 1.096640501083157e-10, "loss": 0.9465, "step": 33099 }, { "epoch": 1.0, "learning_rate": 1.0739129798070792e-10, "loss": 1.0785, "step": 33100 }, { "epoch": 1.0, "learning_rate": 1.0514234362657417e-10, "loss": 1.1268, "step": 33101 }, { "epoch": 1.0, "learning_rate": 1.0291718706756382e-10, "loss": 1.1449, "step": 33102 }, { "epoch": 1.0, "learning_rate": 1.0071582832449356e-10, "loss": 1.0773, "step": 33103 }, { "epoch": 1.0, "learning_rate": 9.853826741901274e-11, "loss": 1.1072, "step": 33104 }, { "epoch": 1.0, "learning_rate": 9.638450437138291e-11, "loss": 1.1156, "step": 33105 }, { "epoch": 1.0, "learning_rate": 9.425453920186567e-11, "loss": 1.0998, "step": 33106 }, { "epoch": 1.0, "learning_rate": 9.214837193155524e-11, "loss": 1.0825, "step": 33107 }, { "epoch": 1.0, "learning_rate": 9.006600257960296e-11, "loss": 1.0976, "step": 33108 }, { "epoch": 1.0, "learning_rate": 8.800743116627042e-11, "loss": 1.1541, "step": 33109 }, { "epoch": 1.0, "learning_rate": 8.597265771126406e-11, "loss": 1.096, "step": 33110 }, { "epoch": 1.0, "learning_rate": 8.396168223373524e-11, "loss": 1.1036, "step": 33111 }, { "epoch": 1.0, "learning_rate": 8.19745047528353e-11, "loss": 1.1827, "step": 33112 }, { "epoch": 1.0, "learning_rate": 8.00111252877156e-11, "loss": 0.9734, "step": 33113 }, { "epoch": 1.0, "learning_rate": 7.807154385669479e-11, "loss": 1.1946, "step": 33114 }, { "epoch": 1.0, "learning_rate": 7.615576047836914e-11, "loss": 0.9805, "step": 33115 }, { "epoch": 1.0, "learning_rate": 7.426377517133488e-11, "loss": 1.0746, "step": 33116 }, { "epoch": 1.0, "learning_rate": 7.239558795307799e-11, "loss": 1.1457, "step": 33117 }, { "epoch": 1.0, "learning_rate": 7.055119884163964e-11, "loss": 1.1096, "step": 33118 }, { "epoch": 1.0, "learning_rate": 6.87306078545058e-11, "loss": 1.1057, "step": 33119 }, { "epoch": 1.0, "learning_rate": 6.693381500916252e-11, "loss": 1.1655, "step": 33120 }, { "epoch": 1.0, "learning_rate": 6.516082032254067e-11, "loss": 1.1645, "step": 33121 }, { "epoch": 1.0, "learning_rate": 6.341162381157118e-11, "loss": 0.972, "step": 33122 }, { "epoch": 1.0, "learning_rate": 6.168622549290737e-11, "loss": 1.0839, "step": 33123 }, { "epoch": 1.0, "learning_rate": 5.998462538292504e-11, "loss": 1.1168, "step": 33124 }, { "epoch": 1.0, "learning_rate": 5.830682349799999e-11, "loss": 1.0378, "step": 33125 }, { "epoch": 1.0, "learning_rate": 5.665281985395288e-11, "loss": 1.0155, "step": 33126 }, { "epoch": 1.0, "learning_rate": 5.502261446632684e-11, "loss": 1.0825, "step": 33127 }, { "epoch": 1.0, "learning_rate": 5.341620735122011e-11, "loss": 1.1794, "step": 33128 }, { "epoch": 1.0, "learning_rate": 5.183359852334313e-11, "loss": 1.1109, "step": 33129 }, { "epoch": 1.0, "learning_rate": 5.027478799796148e-11, "loss": 1.0938, "step": 33130 }, { "epoch": 1.0, "learning_rate": 4.873977579006317e-11, "loss": 0.9793, "step": 33131 }, { "epoch": 1.0, "learning_rate": 4.722856191435865e-11, "loss": 1.1646, "step": 33132 }, { "epoch": 1.0, "learning_rate": 4.574114638472571e-11, "loss": 1.0902, "step": 33133 }, { "epoch": 1.0, "learning_rate": 4.427752921559725e-11, "loss": 1.0601, "step": 33134 }, { "epoch": 1.0, "learning_rate": 4.283771042112861e-11, "loss": 1.1811, "step": 33135 }, { "epoch": 1.0, "learning_rate": 4.142169001464247e-11, "loss": 1.2047, "step": 33136 }, { "epoch": 1.0, "learning_rate": 4.0029468010016614e-11, "loss": 1.1036, "step": 33137 }, { "epoch": 1.0, "learning_rate": 3.866104442001861e-11, "loss": 1.0632, "step": 33138 }, { "epoch": 1.0, "learning_rate": 3.731641925824869e-11, "loss": 1.1048, "step": 33139 }, { "epoch": 1.0, "learning_rate": 3.599559253691931e-11, "loss": 1.1401, "step": 33140 }, { "epoch": 1.0, "learning_rate": 3.4698564269075583e-11, "loss": 1.081, "step": 33141 }, { "epoch": 1.0, "learning_rate": 3.3425334466652413e-11, "loss": 1.1409, "step": 33142 }, { "epoch": 1.0, "learning_rate": 3.217590314213981e-11, "loss": 1.2343, "step": 33143 }, { "epoch": 1.0, "learning_rate": 3.0950270307472664e-11, "loss": 1.1107, "step": 33144 }, { "epoch": 1.0, "learning_rate": 2.9748435973753206e-11, "loss": 1.0673, "step": 33145 }, { "epoch": 1.0, "learning_rate": 2.85704001531939e-11, "loss": 0.9727, "step": 33146 }, { "epoch": 1.0, "learning_rate": 2.7416162856341855e-11, "loss": 1.0475, "step": 33147 }, { "epoch": 1.0, "learning_rate": 2.628572409457686e-11, "loss": 1.1937, "step": 33148 }, { "epoch": 1.0, "learning_rate": 2.517908387844603e-11, "loss": 1.2767, "step": 33149 }, { "epoch": 1.0, "learning_rate": 2.409624221849649e-11, "loss": 1.1508, "step": 33150 }, { "epoch": 1.0, "learning_rate": 2.3037199125275354e-11, "loss": 1.0529, "step": 33151 }, { "epoch": 1.0, "learning_rate": 2.2001954608774634e-11, "loss": 1.0743, "step": 33152 }, { "epoch": 1.0, "learning_rate": 2.0990508678708778e-11, "loss": 1.0549, "step": 33153 }, { "epoch": 1.0, "learning_rate": 2.0002861344792233e-11, "loss": 1.2216, "step": 33154 }, { "epoch": 1.0, "learning_rate": 1.9039012616461904e-11, "loss": 1.148, "step": 33155 }, { "epoch": 1.0, "learning_rate": 1.809896250259957e-11, "loss": 1.1783, "step": 33156 }, { "epoch": 1.0, "learning_rate": 1.7182711012642128e-11, "loss": 1.08, "step": 33157 }, { "epoch": 1.0, "learning_rate": 1.6290258155193804e-11, "loss": 1.0224, "step": 33158 }, { "epoch": 1.0, "learning_rate": 1.5421603938303718e-11, "loss": 1.0767, "step": 33159 }, { "epoch": 1.0, "learning_rate": 1.4576748370853655e-11, "loss": 1.0325, "step": 33160 }, { "epoch": 1.0, "learning_rate": 1.3755691460337617e-11, "loss": 1.0644, "step": 33161 }, { "epoch": 1.0, "learning_rate": 1.2958433215082278e-11, "loss": 1.2864, "step": 33162 }, { "epoch": 1.0, "learning_rate": 1.2184973642304088e-11, "loss": 1.0948, "step": 33163 }, { "epoch": 1.0, "learning_rate": 1.1435312749497052e-11, "loss": 1.0555, "step": 33164 }, { "epoch": 1.0, "learning_rate": 1.070945054387762e-11, "loss": 1.1112, "step": 33165 }, { "epoch": 1.0, "learning_rate": 1.000738703210713e-11, "loss": 1.1691, "step": 33166 }, { "epoch": 1.0, "learning_rate": 9.329122221124476e-12, "loss": 1.0519, "step": 33167 }, { "epoch": 1.0, "learning_rate": 8.67465611731344e-12, "loss": 1.0447, "step": 33168 }, { "epoch": 1.0, "learning_rate": 8.04398872678025e-12, "loss": 1.0714, "step": 33169 }, { "epoch": 1.0, "learning_rate": 7.437120055631131e-12, "loss": 1.0355, "step": 33170 }, { "epoch": 1.0, "learning_rate": 6.854050109694754e-12, "loss": 0.9724, "step": 33171 }, { "epoch": 1.0, "learning_rate": 6.294778894522236e-12, "loss": 1.0798, "step": 33172 }, { "epoch": 1.0, "learning_rate": 5.759306415387134e-12, "loss": 1.0808, "step": 33173 }, { "epoch": 1.0, "learning_rate": 5.247632677285452e-12, "loss": 1.0862, "step": 33174 }, { "epoch": 1.0, "learning_rate": 4.7597576852131956e-12, "loss": 1.0765, "step": 33175 }, { "epoch": 1.0, "learning_rate": 4.29568144388881e-12, "loss": 1.0955, "step": 33176 }, { "epoch": 1.0, "learning_rate": 3.855403957475634e-12, "loss": 0.932, "step": 33177 }, { "epoch": 1.0, "learning_rate": 3.438925230414558e-12, "loss": 1.0955, "step": 33178 }, { "epoch": 1.0, "learning_rate": 3.0462452665913633e-12, "loss": 1.2332, "step": 33179 }, { "epoch": 1.0, "learning_rate": 2.6773640696142744e-12, "loss": 1.018, "step": 33180 }, { "epoch": 1.0, "learning_rate": 2.3322816430915163e-12, "loss": 1.024, "step": 33181 }, { "epoch": 1.0, "learning_rate": 2.010997990631314e-12, "loss": 1.1562, "step": 33182 }, { "epoch": 1.0, "learning_rate": 1.7135131147316687e-12, "loss": 1.1175, "step": 33183 }, { "epoch": 1.0, "learning_rate": 1.439827018445694e-12, "loss": 1.0069, "step": 33184 }, { "epoch": 1.0, "learning_rate": 1.189939704548948e-12, "loss": 1.0455, "step": 33185 }, { "epoch": 1.0, "learning_rate": 9.638511752618762e-13, "loss": 1.2671, "step": 33186 }, { "epoch": 1.0, "learning_rate": 7.615614325273691e-13, "loss": 1.2811, "step": 33187 }, { "epoch": 1.0, "learning_rate": 5.830704788434283e-13, "loss": 1.2257, "step": 33188 }, { "epoch": 1.0, "learning_rate": 4.2837831532027697e-13, "loss": 1.047, "step": 33189 }, { "epoch": 1.0, "learning_rate": 2.974849439008054e-13, "loss": 1.0248, "step": 33190 }, { "epoch": 1.0, "learning_rate": 1.9039036541768086e-13, "loss": 1.1207, "step": 33191 }, { "epoch": 1.0, "learning_rate": 1.0709458125868211e-13, "loss": 1.1119, "step": 33192 }, { "epoch": 1.0, "learning_rate": 4.759759170136491e-14, "loss": 1.1302, "step": 33193 }, { "epoch": 1.0, "learning_rate": 1.1899397855952288e-14, "loss": 1.1273, "step": 33194 }, { "epoch": 1.0, "learning_rate": 0.0, "loss": 1.1128, "step": 33195 }, { "epoch": 1.0, "step": 33195, "total_flos": 7183881258045440.0, "train_loss": 1.1314439481955585, "train_runtime": 84160.343, "train_samples_per_second": 12.621, "train_steps_per_second": 0.394 } ], "max_steps": 33195, "num_train_epochs": 1, "total_flos": 7183881258045440.0, "trial_name": null, "trial_params": null }